{ "epoch": 3.0, "num_input_tokens_seen": 122880000, "total_flos": 1.580945522688e+16, "train_loss": 0.10143799341519674, "train_runtime": 4258.2582, "train_samples": 320000, "train_samples_per_second": 225.444, "train_steps_per_second": 28.181, "train_tokens_per_second": 28856.869 }