{ "epoch": 3.0, "eval_loss": 0.09235269576311111, "eval_mse": 0.09235269895339973, "eval_runtime": 9.5082, "eval_samples": 10000, "eval_samples_per_second": 1051.725, "eval_steps_per_second": 131.466, "num_input_tokens_seen": 34560000, "total_flos": 4446488701440000.0, "train_loss": 0.08211795973601164, "train_runtime": 1433.1905, "train_samples": 90000, "train_samples_per_second": 188.391, "train_steps_per_second": 23.549, "train_tokens_per_second": 24114.032 }