InstabilityZoo / metadata /ckpt_109.json
lxe5wipauser17
gpt2-medium
dea19e4
{
"checkpoint": "ckpt_109.pt",
"model": "GPT2-M",
"training_step": 76000,
"instability_type": "Recoverable loss spikes",
"learning_rate": "3e-3",
"decay": "0.1",
"warm": "2000",
"data_type": "BF16",
"reproducibility": false
}