{ "epoch": 9.716417910447761, "eval_loss": 1.0977526903152466, "eval_runtime": 1.7342, "eval_samples_per_second": 1054.072, "eval_steps_per_second": 16.722, "perplexity": 2.9974223129878887, "total_flos": 5406457244811264.0, "train_loss": 1.8237198396162553, "train_runtime": 182.316, "train_samples_per_second": 467.759, "train_steps_per_second": 1.81 }