{
  "checkpoint": "ckpt_118.pt",
  "model": "GPT2-L",
  "training_step": 40000,
  "instability_type": "Recoverable loss spikes",
  "learning_rate": "1e-3",
  "decay": "0.1",
  "warm": "0",
  "data_type": "BF16",
  "reproducibility": true
}
{
  "checkpoint": "ckpt_118.pt",
  "model": "GPT2-L",
  "training_step": 40000,
  "instability_type": "Recoverable loss spikes",
  "learning_rate": "1e-3",
  "decay": "0.1",
  "warm": "0",
  "data_type": "BF16",
  "reproducibility": true
}