|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.951525, |
|
"eval_combined_score": 1.3493705490187269, |
|
"eval_loss": 0.198301300406456, |
|
"eval_runtime": 39.4383, |
|
"eval_samples": 80000, |
|
"eval_samples_per_second": 2028.484, |
|
"eval_steps_per_second": 253.56, |
|
"num_input_tokens_seen": 122880000, |
|
"total_flos": 1.580945522688e+16, |
|
"train_loss": 0.10143799341519674, |
|
"train_runtime": 4258.2582, |
|
"train_samples": 320000, |
|
"train_samples_per_second": 225.444, |
|
"train_steps_per_second": 28.181, |
|
"train_tokens_per_second": 28856.869 |
|
} |