{ "checkpoint": "ckpt_14.pt", "model": "GPT2-S", "training_step": 4000, "instability_type": "complete non-convergence", "learning_rate": "1e-2", "decay": "0.1", "warm": "0", "data_type": "BF16" }