{ "epoch": 3.0, "eval_loss": 0.803139865398407, "eval_runtime": 137.774, "eval_samples": 134, "eval_samples_per_second": 0.973, "eval_steps_per_second": 0.123, "perplexity": 2.232539809468662, "train_loss": 0.9154848974025481, "train_runtime": 4986.1228, "train_samples": 446, "train_samples_per_second": 0.268, "train_steps_per_second": 0.134 }