{
  "epoch": 2.995008319467554,
  "eval_accuracy": 0.5815950446091447,
  "eval_loss": 0.9033203125,
  "eval_runtime": 984.991,
  "eval_samples": 921,
  "eval_samples_per_second": 0.935,
  "eval_steps_per_second": 0.235,
  "perplexity": 2.4677833350465583,
  "total_flos": 116490238033920.0,
  "train_loss": 0.36549280296873166,
  "train_runtime": 96569.5267,
  "train_samples": 7211,
  "train_samples_per_second": 0.224,
  "train_steps_per_second": 0.007
}