{"current_steps": 5, "total_steps": 192, "loss": 4.5817, "lr": 4.991638098272951e-05, "epoch": 0.20833333333333334, "percentage": 2.6, "elapsed_time": "0:03:37", "remaining_time": "2:15:48", "throughput": 323.11, "total_tokens": 70400} {"current_steps": 10, "total_steps": 192, "loss": 0.4906, "lr": 4.966608330212198e-05, "epoch": 0.4166666666666667, "percentage": 5.21, "elapsed_time": "0:07:07", "remaining_time": "2:09:31", "throughput": 333.23, "total_tokens": 142296} {"current_steps": 15, "total_steps": 192, "loss": 0.5919, "lr": 4.9250781329863606e-05, "epoch": 0.625, "percentage": 7.81, "elapsed_time": "0:10:36", "remaining_time": "2:05:06", "throughput": 338.33, "total_tokens": 215224} {"current_steps": 20, "total_steps": 192, "loss": 0.3977, "lr": 4.867325323737765e-05, "epoch": 0.8333333333333334, "percentage": 10.42, "elapsed_time": "0:14:04", "remaining_time": "2:01:06", "throughput": 337.95, "total_tokens": 285568} {"current_steps": 25, "total_steps": 192, "loss": 0.4036, "lr": 4.793736241118728e-05, "epoch": 1.0416666666666667, "percentage": 13.02, "elapsed_time": "0:17:34", "remaining_time": "1:57:24", "throughput": 339.45, "total_tokens": 357968} {"current_steps": 30, "total_steps": 192, "loss": 0.3966, "lr": 4.7048031608708876e-05, "epoch": 1.25, "percentage": 15.62, "elapsed_time": "0:21:11", "remaining_time": "1:54:24", "throughput": 337.37, "total_tokens": 428848} {"current_steps": 35, "total_steps": 192, "loss": 0.3386, "lr": 4.601121002736095e-05, "epoch": 1.4583333333333333, "percentage": 18.23, "elapsed_time": "0:24:47", "remaining_time": "1:51:13", "throughput": 336.46, "total_tokens": 500536} {"current_steps": 40, "total_steps": 192, "loss": 0.3656, "lr": 4.4833833507280884e-05, "epoch": 1.6666666666666665, "percentage": 20.83, "elapsed_time": "0:28:23", "remaining_time": "1:47:53", "throughput": 336.17, "total_tokens": 572648} {"current_steps": 45, "total_steps": 192, "loss": 0.3556, "lr": 4.352377813387398e-05, "epoch": 1.875, "percentage": 23.44, "elapsed_time": "0:31:59", "remaining_time": "1:44:28", "throughput": 335.38, "total_tokens": 643624} {"current_steps": 50, "total_steps": 192, "loss": 0.2927, "lr": 4.208980755057178e-05, "epoch": 2.0833333333333335, "percentage": 26.04, "elapsed_time": "0:35:34", "remaining_time": "1:41:01", "throughput": 335.22, "total_tokens": 715504} {"current_steps": 55, "total_steps": 192, "loss": 0.2644, "lr": 4.054151433425194e-05, "epoch": 2.2916666666666665, "percentage": 28.65, "elapsed_time": "0:39:06", "remaining_time": "1:37:24", "throughput": 335.15, "total_tokens": 786328} {"current_steps": 60, "total_steps": 192, "loss": 0.2624, "lr": 3.888925582549006e-05, "epoch": 2.5, "percentage": 31.25, "elapsed_time": "0:42:34", "remaining_time": "1:33:40", "throughput": 335.39, "total_tokens": 856784} {"current_steps": 65, "total_steps": 192, "loss": 0.2458, "lr": 3.7144084842908505e-05, "epoch": 2.7083333333333335, "percentage": 33.85, "elapsed_time": "0:46:03", "remaining_time": "1:29:58", "throughput": 336.5, "total_tokens": 929768} {"current_steps": 70, "total_steps": 192, "loss": 0.2809, "lr": 3.5317675745109866e-05, "epoch": 2.9166666666666665, "percentage": 36.46, "elapsed_time": "0:49:31", "remaining_time": "1:26:18", "throughput": 336.97, "total_tokens": 1001312} {"current_steps": 75, "total_steps": 192, "loss": 0.2873, "lr": 3.34222463348055e-05, "epoch": 3.125, "percentage": 39.06, "elapsed_time": "0:53:00", "remaining_time": "1:22:41", "throughput": 337.68, "total_tokens": 1074016} {"current_steps": 80, "total_steps": 192, "loss": 0.2201, "lr": 3.147047612756302e-05, "epoch": 3.3333333333333335, "percentage": 41.67, "elapsed_time": "0:56:29", "remaining_time": "1:19:04", "throughput": 337.6, "total_tokens": 1144184} {"current_steps": 85, "total_steps": 192, "loss": 0.1891, "lr": 2.9475421531915827e-05, "epoch": 3.5416666666666665, "percentage": 44.27, "elapsed_time": "0:59:57", "remaining_time": "1:15:28", "throughput": 337.91, "total_tokens": 1215680} {"current_steps": 90, "total_steps": 192, "loss": 0.1966, "lr": 2.7450428508239024e-05, "epoch": 3.75, "percentage": 46.88, "elapsed_time": "1:03:26", "remaining_time": "1:11:53", "throughput": 338.37, "total_tokens": 1287848} {"current_steps": 95, "total_steps": 192, "loss": 0.1773, "lr": 2.5409043290662173e-05, "epoch": 3.9583333333333335, "percentage": 49.48, "elapsed_time": "1:06:53", "remaining_time": "1:08:18", "throughput": 338.62, "total_tokens": 1359184} {"current_steps": 100, "total_steps": 192, "loss": 0.1521, "lr": 2.3364921769246423e-05, "epoch": 4.166666666666667, "percentage": 52.08, "elapsed_time": "1:10:21", "remaining_time": "1:04:43", "throughput": 339.17, "total_tokens": 1431816} {"current_steps": 100, "total_steps": 192, "eval_loss": 0.3628197908401489, "epoch": 4.166666666666667, "percentage": 52.08, "elapsed_time": "1:12:10", "remaining_time": "1:06:24", "throughput": 330.63, "total_tokens": 1431816} {"current_steps": 105, "total_steps": 192, "loss": 0.0969, "lr": 2.1331738138615958e-05, "epoch": 4.375, "percentage": 54.69, "elapsed_time": "1:17:07", "remaining_time": "1:03:54", "throughput": 325.01, "total_tokens": 1503912} {"current_steps": 110, "total_steps": 192, "loss": 0.1199, "lr": 1.932309342414067e-05, "epoch": 4.583333333333333, "percentage": 57.29, "elapsed_time": "1:20:34", "remaining_time": "1:00:03", "throughput": 325.98, "total_tokens": 1575912} {"current_steps": 115, "total_steps": 192, "loss": 0.1323, "lr": 1.7352424497586163e-05, "epoch": 4.791666666666667, "percentage": 59.9, "elapsed_time": "1:24:01", "remaining_time": "0:56:15", "throughput": 326.51, "total_tokens": 1646056} {"current_steps": 120, "total_steps": 192, "loss": 0.1403, "lr": 1.5432914190872757e-05, "epoch": 5.0, "percentage": 62.5, "elapsed_time": "1:27:28", "remaining_time": "0:52:29", "throughput": 327.24, "total_tokens": 1717560} {"current_steps": 125, "total_steps": 192, "loss": 0.1139, "lr": 1.3577403109239484e-05, "epoch": 5.208333333333333, "percentage": 65.1, "elapsed_time": "1:31:02", "remaining_time": "0:48:47", "throughput": 327.58, "total_tokens": 1789304} {"current_steps": 130, "total_steps": 192, "loss": 0.0935, "lr": 1.1798303733740802e-05, "epoch": 5.416666666666667, "percentage": 67.71, "elapsed_time": "1:34:38", "remaining_time": "0:45:08", "throughput": 327.48, "total_tokens": 1859552} {"current_steps": 135, "total_steps": 192, "loss": 0.0502, "lr": 1.0107517387689166e-05, "epoch": 5.625, "percentage": 70.31, "elapsed_time": "1:38:11", "remaining_time": "0:41:27", "throughput": 327.8, "total_tokens": 1931216} {"current_steps": 140, "total_steps": 192, "loss": 0.043, "lr": 8.51635462249828e-06, "epoch": 5.833333333333333, "percentage": 72.92, "elapsed_time": "1:41:42", "remaining_time": "0:37:46", "throughput": 328.38, "total_tokens": 2003784} {"current_steps": 145, "total_steps": 192, "loss": 0.0432, "lr": 7.035459555507548e-06, "epoch": 6.041666666666667, "percentage": 75.52, "elapsed_time": "1:45:12", "remaining_time": "0:34:06", "throughput": 328.81, "total_tokens": 2075648} {"current_steps": 150, "total_steps": 192, "loss": 0.0336, "lr": 5.674738665931575e-06, "epoch": 6.25, "percentage": 78.12, "elapsed_time": "1:48:43", "remaining_time": "0:30:26", "throughput": 329.18, "total_tokens": 2147344} {"current_steps": 155, "total_steps": 192, "loss": 0.0189, "lr": 4.4432945252556284e-06, "epoch": 6.458333333333333, "percentage": 80.73, "elapsed_time": "1:52:13", "remaining_time": "0:26:47", "throughput": 329.52, "total_tokens": 2218968} {"current_steps": 160, "total_steps": 192, "loss": 0.0344, "lr": 3.3493649053890326e-06, "epoch": 6.666666666666667, "percentage": 83.33, "elapsed_time": "1:55:44", "remaining_time": "0:23:08", "throughput": 329.81, "total_tokens": 2290400} {"current_steps": 165, "total_steps": 192, "loss": 0.0112, "lr": 2.4002676719139166e-06, "epoch": 6.875, "percentage": 85.94, "elapsed_time": "1:59:15", "remaining_time": "0:19:30", "throughput": 330.13, "total_tokens": 2362184} {"current_steps": 170, "total_steps": 192, "loss": 0.0071, "lr": 1.6023518310668618e-06, "epoch": 7.083333333333333, "percentage": 88.54, "elapsed_time": "2:02:45", "remaining_time": "0:15:53", "throughput": 330.25, "total_tokens": 2432600} {"current_steps": 175, "total_steps": 192, "loss": 0.0239, "lr": 9.609550579259496e-07, "epoch": 7.291666666666667, "percentage": 91.15, "elapsed_time": "2:06:16", "remaining_time": "0:12:16", "throughput": 330.37, "total_tokens": 2503072} {"current_steps": 180, "total_steps": 192, "loss": 0.0051, "lr": 4.803679899192392e-07, "epoch": 7.5, "percentage": 93.75, "elapsed_time": "2:09:46", "remaining_time": "0:08:39", "throughput": 330.7, "total_tokens": 2575144} {"current_steps": 185, "total_steps": 192, "loss": 0.0197, "lr": 1.6380552451389086e-07, "epoch": 7.708333333333333, "percentage": 96.35, "elapsed_time": "2:13:17", "remaining_time": "0:05:02", "throughput": 330.96, "total_tokens": 2646888} {"current_steps": 190, "total_steps": 192, "loss": 0.0048, "lr": 1.3385313090857887e-08, "epoch": 7.916666666666667, "percentage": 98.96, "elapsed_time": "2:16:45", "remaining_time": "0:01:26", "throughput": 331.39, "total_tokens": 2719168} {"current_steps": 192, "total_steps": 192, "epoch": 8.0, "percentage": 100.0, "elapsed_time": "2:19:52", "remaining_time": "0:00:00", "throughput": 327.46, "total_tokens": 2748096}