qwen2.5-1.5b-sft3-25-3 / all_results.json
hZzy's picture
End of training
9807c7a verified
{
"epoch": 9.75609756097561,
"eval_loss": 2.1613569259643555,
"eval_runtime": 18.8811,
"eval_samples": 4988,
"eval_samples_per_second": 39.087,
"eval_steps_per_second": 1.006,
"total_flos": 1.742036445167616e+16,
"train_loss": 2.3644245743751524,
"train_runtime": 7118.2054,
"train_samples": 43233,
"train_samples_per_second": 9.167,
"train_steps_per_second": 0.028
}