{"current_steps": 1, "total_steps": 1080, "loss": 0.6713, "lr": 4.999989423013716e-05, "epoch": 0.01834862385321101, "percentage": 0.09, "elapsed_time": "0:00:21", "remaining_time": "6:29:52", "throughput": 2035.78, "total_tokens": 44136} {"current_steps": 2, "total_steps": 1080, "loss": 0.533, "lr": 4.999957692144361e-05, "epoch": 0.03669724770642202, "percentage": 0.19, "elapsed_time": "0:00:38", "remaining_time": "5:44:44", "throughput": 2165.29, "total_tokens": 83096} {"current_steps": 3, "total_steps": 1080, "loss": 0.6048, "lr": 4.999904807660428e-05, "epoch": 0.05504587155963303, "percentage": 0.28, "elapsed_time": "0:00:54", "remaining_time": "5:23:37", "throughput": 2257.64, "total_tokens": 122112} {"current_steps": 4, "total_steps": 1080, "loss": 0.4948, "lr": 4.999830770009406e-05, "epoch": 0.07339449541284404, "percentage": 0.37, "elapsed_time": "0:01:10", "remaining_time": "5:15:31", "throughput": 2316.97, "total_tokens": 163064} {"current_steps": 5, "total_steps": 1080, "loss": 0.6607, "lr": 4.999735579817769e-05, "epoch": 0.09174311926605505, "percentage": 0.46, "elapsed_time": "0:01:29", "remaining_time": "5:19:42", "throughput": 2284.28, "total_tokens": 203808} {"current_steps": 6, "total_steps": 1080, "loss": 0.5802, "lr": 4.9996192378909786e-05, "epoch": 0.11009174311926606, "percentage": 0.56, "elapsed_time": "0:01:45", "remaining_time": "5:15:08", "throughput": 2289.22, "total_tokens": 241824} {"current_steps": 7, "total_steps": 1080, "loss": 0.5148, "lr": 4.999481745213471e-05, "epoch": 0.12844036697247707, "percentage": 0.65, "elapsed_time": "0:02:04", "remaining_time": "5:17:48", "throughput": 2312.04, "total_tokens": 287608} {"current_steps": 8, "total_steps": 1080, "loss": 0.5714, "lr": 4.9993231029486544e-05, "epoch": 0.14678899082568808, "percentage": 0.74, "elapsed_time": "0:02:19", "remaining_time": "5:12:13", "throughput": 2327.0, "total_tokens": 325320} {"current_steps": 9, "total_steps": 1080, "loss": 0.6812, "lr": 4.999143312438893e-05, "epoch": 0.1651376146788991, "percentage": 0.83, "elapsed_time": "0:02:41", "remaining_time": "5:20:10", "throughput": 2291.07, "total_tokens": 369848} {"current_steps": 10, "total_steps": 1080, "loss": 0.5358, "lr": 4.998942375205502e-05, "epoch": 0.1834862385321101, "percentage": 0.93, "elapsed_time": "0:03:00", "remaining_time": "5:21:42", "throughput": 2301.07, "total_tokens": 415104} {"current_steps": 11, "total_steps": 1080, "loss": 0.6527, "lr": 4.9987202929487275e-05, "epoch": 0.2018348623853211, "percentage": 1.02, "elapsed_time": "0:03:20", "remaining_time": "5:24:18", "throughput": 2333.48, "total_tokens": 467224} {"current_steps": 12, "total_steps": 1080, "loss": 0.5354, "lr": 4.99847706754774e-05, "epoch": 0.22018348623853212, "percentage": 1.11, "elapsed_time": "0:03:37", "remaining_time": "5:22:50", "throughput": 2310.28, "total_tokens": 502824} {"current_steps": 13, "total_steps": 1080, "loss": 0.5263, "lr": 4.998212701060612e-05, "epoch": 0.23853211009174313, "percentage": 1.2, "elapsed_time": "0:03:54", "remaining_time": "5:20:38", "throughput": 2324.0, "total_tokens": 544744} {"current_steps": 14, "total_steps": 1080, "loss": 0.5536, "lr": 4.997927195724303e-05, "epoch": 0.25688073394495414, "percentage": 1.3, "elapsed_time": "0:04:12", "remaining_time": "5:20:49", "throughput": 2338.23, "total_tokens": 591136} {"current_steps": 15, "total_steps": 1080, "loss": 0.6106, "lr": 4.997620553954645e-05, "epoch": 0.27522935779816515, "percentage": 1.39, "elapsed_time": "0:04:29", "remaining_time": "5:19:28", "throughput": 2332.23, "total_tokens": 629664} {"current_steps": 16, "total_steps": 1080, "loss": 0.5129, "lr": 4.997292778346312e-05, "epoch": 0.29357798165137616, "percentage": 1.48, "elapsed_time": "0:04:43", "remaining_time": "5:14:17", "throughput": 2339.41, "total_tokens": 663392} {"current_steps": 17, "total_steps": 1080, "loss": 0.6377, "lr": 4.996943871672807e-05, "epoch": 0.3119266055045872, "percentage": 1.57, "elapsed_time": "0:04:56", "remaining_time": "5:09:29", "throughput": 2351.55, "total_tokens": 698360} {"current_steps": 18, "total_steps": 1080, "loss": 0.4083, "lr": 4.996573836886435e-05, "epoch": 0.3302752293577982, "percentage": 1.67, "elapsed_time": "0:05:14", "remaining_time": "5:08:50", "throughput": 2348.27, "total_tokens": 737520} {"current_steps": 19, "total_steps": 1080, "loss": 0.6086, "lr": 4.9961826771182784e-05, "epoch": 0.3486238532110092, "percentage": 1.76, "elapsed_time": "0:05:27", "remaining_time": "5:04:22", "throughput": 2348.56, "total_tokens": 768056} {"current_steps": 20, "total_steps": 1080, "loss": 0.4591, "lr": 4.995770395678171e-05, "epoch": 0.3669724770642202, "percentage": 1.85, "elapsed_time": "0:05:44", "remaining_time": "5:04:20", "throughput": 2340.06, "total_tokens": 806256} {"current_steps": 21, "total_steps": 1080, "loss": 0.3731, "lr": 4.9953369960546676e-05, "epoch": 0.3853211009174312, "percentage": 1.94, "elapsed_time": "0:06:00", "remaining_time": "5:02:35", "throughput": 2339.7, "total_tokens": 842336} {"current_steps": 22, "total_steps": 1080, "loss": 0.6243, "lr": 4.9948824819150185e-05, "epoch": 0.4036697247706422, "percentage": 2.04, "elapsed_time": "0:06:15", "remaining_time": "5:00:51", "throughput": 2335.49, "total_tokens": 876672} {"current_steps": 23, "total_steps": 1080, "loss": 0.5788, "lr": 4.994406857105136e-05, "epoch": 0.42201834862385323, "percentage": 2.13, "elapsed_time": "0:06:33", "remaining_time": "5:01:14", "throughput": 2326.96, "total_tokens": 915192} {"current_steps": 24, "total_steps": 1080, "loss": 0.4753, "lr": 4.993910125649561e-05, "epoch": 0.44036697247706424, "percentage": 2.22, "elapsed_time": "0:06:49", "remaining_time": "5:00:07", "throughput": 2325.87, "total_tokens": 951904} {"current_steps": 25, "total_steps": 1080, "loss": 0.4518, "lr": 4.993392291751431e-05, "epoch": 0.45871559633027525, "percentage": 2.31, "elapsed_time": "0:07:08", "remaining_time": "5:01:38", "throughput": 2335.97, "total_tokens": 1001816} {"current_steps": 26, "total_steps": 1080, "loss": 0.5638, "lr": 4.992853359792444e-05, "epoch": 0.47706422018348627, "percentage": 2.41, "elapsed_time": "0:07:31", "remaining_time": "5:04:56", "throughput": 2333.16, "total_tokens": 1053064} {"current_steps": 27, "total_steps": 1080, "loss": 0.4644, "lr": 4.99229333433282e-05, "epoch": 0.4954128440366973, "percentage": 2.5, "elapsed_time": "0:07:45", "remaining_time": "5:02:22", "throughput": 2335.97, "total_tokens": 1086688} {"current_steps": 28, "total_steps": 1080, "loss": 0.6191, "lr": 4.9917122201112656e-05, "epoch": 0.5137614678899083, "percentage": 2.59, "elapsed_time": "0:08:05", "remaining_time": "5:03:51", "throughput": 2338.67, "total_tokens": 1134824} {"current_steps": 29, "total_steps": 1080, "loss": 0.6752, "lr": 4.9911100220449293e-05, "epoch": 0.5321100917431193, "percentage": 2.69, "elapsed_time": "0:08:21", "remaining_time": "5:02:53", "throughput": 2337.36, "total_tokens": 1172072} {"current_steps": 30, "total_steps": 1080, "loss": 0.3587, "lr": 4.990486745229364e-05, "epoch": 0.5504587155963303, "percentage": 2.78, "elapsed_time": "0:08:37", "remaining_time": "5:02:02", "throughput": 2338.95, "total_tokens": 1211096} {"current_steps": 31, "total_steps": 1080, "loss": 0.459, "lr": 4.989842394938482e-05, "epoch": 0.5688073394495413, "percentage": 2.87, "elapsed_time": "0:08:57", "remaining_time": "5:03:20", "throughput": 2341.57, "total_tokens": 1259456} {"current_steps": 32, "total_steps": 1080, "loss": 0.4148, "lr": 4.989176976624511e-05, "epoch": 0.5871559633027523, "percentage": 2.96, "elapsed_time": "0:09:19", "remaining_time": "5:05:31", "throughput": 2334.95, "total_tokens": 1306944} {"current_steps": 33, "total_steps": 1080, "loss": 0.539, "lr": 4.988490495917947e-05, "epoch": 0.6055045871559633, "percentage": 3.06, "elapsed_time": "0:09:42", "remaining_time": "5:07:48", "throughput": 2325.65, "total_tokens": 1353744} {"current_steps": 34, "total_steps": 1080, "loss": 0.5453, "lr": 4.987782958627508e-05, "epoch": 0.6238532110091743, "percentage": 3.15, "elapsed_time": "0:10:00", "remaining_time": "5:07:45", "throughput": 2323.72, "total_tokens": 1394736} {"current_steps": 35, "total_steps": 1080, "loss": 0.468, "lr": 4.987054370740083e-05, "epoch": 0.6422018348623854, "percentage": 3.24, "elapsed_time": "0:10:21", "remaining_time": "5:09:18", "throughput": 2319.93, "total_tokens": 1442048} {"current_steps": 36, "total_steps": 1080, "loss": 0.4078, "lr": 4.9863047384206835e-05, "epoch": 0.6605504587155964, "percentage": 3.33, "elapsed_time": "0:10:37", "remaining_time": "5:08:16", "throughput": 2318.0, "total_tokens": 1478440} {"current_steps": 37, "total_steps": 1080, "loss": 0.5299, "lr": 4.9855340680123905e-05, "epoch": 0.6788990825688074, "percentage": 3.43, "elapsed_time": "0:10:57", "remaining_time": "5:09:04", "throughput": 2319.69, "total_tokens": 1525992} {"current_steps": 38, "total_steps": 1080, "loss": 0.439, "lr": 4.9847423660363e-05, "epoch": 0.6972477064220184, "percentage": 3.52, "elapsed_time": "0:11:09", "remaining_time": "5:06:07", "throughput": 2322.37, "total_tokens": 1555608} {"current_steps": 39, "total_steps": 1080, "loss": 0.5337, "lr": 4.983929639191469e-05, "epoch": 0.7155963302752294, "percentage": 3.61, "elapsed_time": "0:11:27", "remaining_time": "5:06:01", "throughput": 2322.14, "total_tokens": 1597392} {"current_steps": 40, "total_steps": 1080, "loss": 0.4536, "lr": 4.983095894354858e-05, "epoch": 0.7339449541284404, "percentage": 3.7, "elapsed_time": "0:11:53", "remaining_time": "5:09:09", "throughput": 2312.22, "total_tokens": 1649656} {"current_steps": 41, "total_steps": 1080, "loss": 0.5221, "lr": 4.982241138581273e-05, "epoch": 0.7522935779816514, "percentage": 3.8, "elapsed_time": "0:12:13", "remaining_time": "5:09:47", "throughput": 2312.16, "total_tokens": 1695952} {"current_steps": 42, "total_steps": 1080, "loss": 0.4279, "lr": 4.9813653791033057e-05, "epoch": 0.7706422018348624, "percentage": 3.89, "elapsed_time": "0:12:31", "remaining_time": "5:09:31", "throughput": 2311.77, "total_tokens": 1737224} {"current_steps": 43, "total_steps": 1080, "loss": 0.5121, "lr": 4.980468623331273e-05, "epoch": 0.7889908256880734, "percentage": 3.98, "elapsed_time": "0:12:44", "remaining_time": "5:07:27", "throughput": 2316.98, "total_tokens": 1772320} {"current_steps": 44, "total_steps": 1080, "loss": 0.54, "lr": 4.979550878853154e-05, "epoch": 0.8073394495412844, "percentage": 4.07, "elapsed_time": "0:13:05", "remaining_time": "5:08:15", "throughput": 2321.91, "total_tokens": 1823888} {"current_steps": 45, "total_steps": 1080, "loss": 0.4488, "lr": 4.9786121534345265e-05, "epoch": 0.8256880733944955, "percentage": 4.17, "elapsed_time": "0:13:27", "remaining_time": "5:09:36", "throughput": 2318.43, "total_tokens": 1872488} {"current_steps": 46, "total_steps": 1080, "loss": 0.4353, "lr": 4.9776524550184965e-05, "epoch": 0.8440366972477065, "percentage": 4.26, "elapsed_time": "0:13:49", "remaining_time": "5:10:44", "throughput": 2320.52, "total_tokens": 1924744} {"current_steps": 47, "total_steps": 1080, "loss": 0.4784, "lr": 4.97667179172564e-05, "epoch": 0.8623853211009175, "percentage": 4.35, "elapsed_time": "0:14:02", "remaining_time": "5:08:45", "throughput": 2325.26, "total_tokens": 1959936} {"current_steps": 48, "total_steps": 1080, "loss": 0.3586, "lr": 4.975670171853926e-05, "epoch": 0.8807339449541285, "percentage": 4.44, "elapsed_time": "0:14:22", "remaining_time": "5:09:03", "throughput": 2323.37, "total_tokens": 2003896} {"current_steps": 49, "total_steps": 1080, "loss": 0.4451, "lr": 4.9746476038786496e-05, "epoch": 0.8990825688073395, "percentage": 4.54, "elapsed_time": "0:14:39", "remaining_time": "5:08:35", "throughput": 2326.95, "total_tokens": 2047632} {"current_steps": 50, "total_steps": 1080, "loss": 0.3591, "lr": 4.973604096452361e-05, "epoch": 0.9174311926605505, "percentage": 4.63, "elapsed_time": "0:15:01", "remaining_time": "5:09:29", "throughput": 2326.25, "total_tokens": 2096928} {"current_steps": 51, "total_steps": 1080, "loss": 0.3415, "lr": 4.9725396584047925e-05, "epoch": 0.9357798165137615, "percentage": 4.72, "elapsed_time": "0:15:15", "remaining_time": "5:07:41", "throughput": 2327.32, "total_tokens": 2129536} {"current_steps": 52, "total_steps": 1080, "loss": 0.3758, "lr": 4.971454298742779e-05, "epoch": 0.9541284403669725, "percentage": 4.81, "elapsed_time": "0:15:29", "remaining_time": "5:06:21", "throughput": 2332.89, "total_tokens": 2169144} {"current_steps": 53, "total_steps": 1080, "loss": 0.485, "lr": 4.97034802665019e-05, "epoch": 0.9724770642201835, "percentage": 4.91, "elapsed_time": "0:15:45", "remaining_time": "5:05:27", "throughput": 2334.2, "total_tokens": 2207720} {"current_steps": 54, "total_steps": 1080, "loss": 0.3469, "lr": 4.9692208514878444e-05, "epoch": 0.9908256880733946, "percentage": 5.0, "elapsed_time": "0:15:57", "remaining_time": "5:03:16", "throughput": 2335.18, "total_tokens": 2236392} {"current_steps": 55, "total_steps": 1080, "loss": 0.4284, "lr": 4.9680727827934354e-05, "epoch": 1.0, "percentage": 5.09, "elapsed_time": "0:16:08", "remaining_time": "5:00:43", "throughput": 2333.32, "total_tokens": 2259088} {"current_steps": 56, "total_steps": 1080, "loss": 0.4186, "lr": 4.966903830281449e-05, "epoch": 1.018348623853211, "percentage": 5.19, "elapsed_time": "0:16:24", "remaining_time": "4:59:54", "throughput": 2335.7, "total_tokens": 2298496} {"current_steps": 57, "total_steps": 1080, "loss": 0.4696, "lr": 4.965714003843079e-05, "epoch": 1.036697247706422, "percentage": 5.28, "elapsed_time": "0:16:38", "remaining_time": "4:58:33", "throughput": 2337.46, "total_tokens": 2333016} {"current_steps": 58, "total_steps": 1080, "loss": 0.3905, "lr": 4.9645033135461494e-05, "epoch": 1.0550458715596331, "percentage": 5.37, "elapsed_time": "0:16:52", "remaining_time": "4:57:20", "throughput": 2338.86, "total_tokens": 2367992} {"current_steps": 59, "total_steps": 1080, "loss": 0.3588, "lr": 4.963271769635024e-05, "epoch": 1.073394495412844, "percentage": 5.46, "elapsed_time": "0:17:15", "remaining_time": "4:58:41", "throughput": 2332.28, "total_tokens": 2415328} {"current_steps": 60, "total_steps": 1080, "loss": 0.5532, "lr": 4.962019382530521e-05, "epoch": 1.091743119266055, "percentage": 5.56, "elapsed_time": "0:17:31", "remaining_time": "4:57:52", "throughput": 2335.02, "total_tokens": 2454792} {"current_steps": 61, "total_steps": 1080, "loss": 0.331, "lr": 4.9607461628298244e-05, "epoch": 1.110091743119266, "percentage": 5.65, "elapsed_time": "0:17:50", "remaining_time": "4:57:56", "throughput": 2339.08, "total_tokens": 2503072} {"current_steps": 62, "total_steps": 1080, "loss": 0.3728, "lr": 4.9594521213063974e-05, "epoch": 1.1284403669724772, "percentage": 5.74, "elapsed_time": "0:18:08", "remaining_time": "4:57:52", "throughput": 2339.9, "total_tokens": 2546960} {"current_steps": 63, "total_steps": 1080, "loss": 0.4695, "lr": 4.958137268909887e-05, "epoch": 1.146788990825688, "percentage": 5.83, "elapsed_time": "0:18:28", "remaining_time": "4:58:12", "throughput": 2341.68, "total_tokens": 2595432} {"current_steps": 64, "total_steps": 1080, "loss": 0.3653, "lr": 4.9568016167660334e-05, "epoch": 1.165137614678899, "percentage": 5.93, "elapsed_time": "0:18:45", "remaining_time": "4:57:52", "throughput": 2339.5, "total_tokens": 2633912} {"current_steps": 65, "total_steps": 1080, "loss": 0.3498, "lr": 4.9554451761765766e-05, "epoch": 1.18348623853211, "percentage": 6.02, "elapsed_time": "0:19:03", "remaining_time": "4:57:42", "throughput": 2343.55, "total_tokens": 2680792} {"current_steps": 66, "total_steps": 1080, "loss": 0.4053, "lr": 4.9540679586191605e-05, "epoch": 1.2018348623853212, "percentage": 6.11, "elapsed_time": "0:19:19", "remaining_time": "4:56:48", "throughput": 2343.65, "total_tokens": 2716584} {"current_steps": 67, "total_steps": 1080, "loss": 0.4189, "lr": 4.952669975747232e-05, "epoch": 1.2201834862385321, "percentage": 6.2, "elapsed_time": "0:19:35", "remaining_time": "4:56:10", "throughput": 2345.83, "total_tokens": 2757088} {"current_steps": 68, "total_steps": 1080, "loss": 0.4994, "lr": 4.951251239389948e-05, "epoch": 1.238532110091743, "percentage": 6.3, "elapsed_time": "0:19:49", "remaining_time": "4:55:09", "throughput": 2349.38, "total_tokens": 2795664} {"current_steps": 69, "total_steps": 1080, "loss": 0.3275, "lr": 4.949811761552074e-05, "epoch": 1.2568807339449541, "percentage": 6.39, "elapsed_time": "0:20:09", "remaining_time": "4:55:20", "throughput": 2348.99, "total_tokens": 2840936} {"current_steps": 70, "total_steps": 1080, "loss": 0.4366, "lr": 4.948351554413879e-05, "epoch": 1.2752293577981653, "percentage": 6.48, "elapsed_time": "0:20:29", "remaining_time": "4:55:33", "throughput": 2348.78, "total_tokens": 2886768} {"current_steps": 71, "total_steps": 1080, "loss": 0.3916, "lr": 4.9468706303310355e-05, "epoch": 1.2935779816513762, "percentage": 6.57, "elapsed_time": "0:20:42", "remaining_time": "4:54:15", "throughput": 2349.78, "total_tokens": 2919328} {"current_steps": 72, "total_steps": 1080, "loss": 0.3249, "lr": 4.9453690018345144e-05, "epoch": 1.311926605504587, "percentage": 6.67, "elapsed_time": "0:21:02", "remaining_time": "4:54:31", "throughput": 2350.37, "total_tokens": 2966744} {"current_steps": 73, "total_steps": 1080, "loss": 0.3956, "lr": 4.943846681630479e-05, "epoch": 1.3302752293577982, "percentage": 6.76, "elapsed_time": "0:21:20", "remaining_time": "4:54:19", "throughput": 2349.13, "total_tokens": 3007248} {"current_steps": 74, "total_steps": 1080, "loss": 0.3956, "lr": 4.942303682600178e-05, "epoch": 1.3486238532110093, "percentage": 6.85, "elapsed_time": "0:21:37", "remaining_time": "4:54:02", "throughput": 2350.99, "total_tokens": 3050960} {"current_steps": 75, "total_steps": 1080, "loss": 0.3773, "lr": 4.940740017799833e-05, "epoch": 1.3669724770642202, "percentage": 6.94, "elapsed_time": "0:21:53", "remaining_time": "4:53:17", "throughput": 2351.86, "total_tokens": 3088592} {"current_steps": 76, "total_steps": 1080, "loss": 0.4, "lr": 4.939155700460536e-05, "epoch": 1.385321100917431, "percentage": 7.04, "elapsed_time": "0:22:17", "remaining_time": "4:54:31", "throughput": 2357.47, "total_tokens": 3153520} {"current_steps": 77, "total_steps": 1080, "loss": 0.4343, "lr": 4.9375507439881266e-05, "epoch": 1.4036697247706422, "percentage": 7.13, "elapsed_time": "0:22:37", "remaining_time": "4:54:48", "throughput": 2355.95, "total_tokens": 3199272} {"current_steps": 78, "total_steps": 1080, "loss": 0.3881, "lr": 4.9359251619630886e-05, "epoch": 1.4220183486238533, "percentage": 7.22, "elapsed_time": "0:22:58", "remaining_time": "4:55:06", "throughput": 2355.76, "total_tokens": 3247128} {"current_steps": 79, "total_steps": 1080, "loss": 0.3972, "lr": 4.9342789681404275e-05, "epoch": 1.4403669724770642, "percentage": 7.31, "elapsed_time": "0:23:19", "remaining_time": "4:55:31", "throughput": 2354.01, "total_tokens": 3294192} {"current_steps": 80, "total_steps": 1080, "loss": 0.3438, "lr": 4.9326121764495596e-05, "epoch": 1.4587155963302751, "percentage": 7.41, "elapsed_time": "0:23:34", "remaining_time": "4:54:45", "throughput": 2353.47, "total_tokens": 3329736} {"current_steps": 81, "total_steps": 1080, "loss": 0.3189, "lr": 4.9309248009941914e-05, "epoch": 1.4770642201834863, "percentage": 7.5, "elapsed_time": "0:23:51", "remaining_time": "4:54:18", "throughput": 2354.75, "total_tokens": 3371376} {"current_steps": 82, "total_steps": 1080, "loss": 0.401, "lr": 4.9292168560522014e-05, "epoch": 1.4954128440366974, "percentage": 7.59, "elapsed_time": "0:24:10", "remaining_time": "4:54:17", "throughput": 2352.03, "total_tokens": 3412368} {"current_steps": 83, "total_steps": 1080, "loss": 0.4973, "lr": 4.9274883560755156e-05, "epoch": 1.5137614678899083, "percentage": 7.69, "elapsed_time": "0:24:30", "remaining_time": "4:54:21", "throughput": 2349.82, "total_tokens": 3455000} {"current_steps": 84, "total_steps": 1080, "loss": 0.3768, "lr": 4.925739315689991e-05, "epoch": 1.5321100917431192, "percentage": 7.78, "elapsed_time": "0:24:43", "remaining_time": "4:53:12", "throughput": 2351.5, "total_tokens": 3488960} {"current_steps": 85, "total_steps": 1080, "loss": 0.2999, "lr": 4.92396974969529e-05, "epoch": 1.5504587155963303, "percentage": 7.87, "elapsed_time": "0:24:57", "remaining_time": "4:52:07", "throughput": 2351.75, "total_tokens": 3521320} {"current_steps": 86, "total_steps": 1080, "loss": 0.3638, "lr": 4.9221796730647516e-05, "epoch": 1.5688073394495414, "percentage": 7.96, "elapsed_time": "0:25:15", "remaining_time": "4:51:58", "throughput": 2348.36, "total_tokens": 3559464} {"current_steps": 87, "total_steps": 1080, "loss": 0.3919, "lr": 4.92036910094527e-05, "epoch": 1.5871559633027523, "percentage": 8.06, "elapsed_time": "0:25:30", "remaining_time": "4:51:09", "throughput": 2350.84, "total_tokens": 3598080} {"current_steps": 88, "total_steps": 1080, "loss": 0.3626, "lr": 4.9185380486571595e-05, "epoch": 1.6055045871559632, "percentage": 8.15, "elapsed_time": "0:25:44", "remaining_time": "4:50:14", "throughput": 2349.74, "total_tokens": 3630064} {"current_steps": 89, "total_steps": 1080, "loss": 0.3439, "lr": 4.916686531694035e-05, "epoch": 1.6238532110091743, "percentage": 8.24, "elapsed_time": "0:25:57", "remaining_time": "4:48:59", "throughput": 2351.21, "total_tokens": 3661408} {"current_steps": 90, "total_steps": 1080, "loss": 0.3236, "lr": 4.914814565722671e-05, "epoch": 1.6422018348623855, "percentage": 8.33, "elapsed_time": "0:26:11", "remaining_time": "4:48:05", "throughput": 2351.75, "total_tokens": 3695480} {"current_steps": 91, "total_steps": 1080, "loss": 0.4255, "lr": 4.912922166582874e-05, "epoch": 1.6605504587155964, "percentage": 8.43, "elapsed_time": "0:26:29", "remaining_time": "4:47:56", "throughput": 2349.33, "total_tokens": 3734560} {"current_steps": 92, "total_steps": 1080, "loss": 0.3061, "lr": 4.9110093502873476e-05, "epoch": 1.6788990825688073, "percentage": 8.52, "elapsed_time": "0:26:43", "remaining_time": "4:47:02", "throughput": 2352.71, "total_tokens": 3773112} {"current_steps": 93, "total_steps": 1080, "loss": 0.3275, "lr": 4.909076133021557e-05, "epoch": 1.6972477064220184, "percentage": 8.61, "elapsed_time": "0:26:59", "remaining_time": "4:46:22", "throughput": 2355.35, "total_tokens": 3813392} {"current_steps": 94, "total_steps": 1080, "loss": 0.4179, "lr": 4.907122531143594e-05, "epoch": 1.7155963302752295, "percentage": 8.7, "elapsed_time": "0:27:19", "remaining_time": "4:46:37", "throughput": 2352.15, "total_tokens": 3856416} {"current_steps": 95, "total_steps": 1080, "loss": 0.3593, "lr": 4.905148561184033e-05, "epoch": 1.7339449541284404, "percentage": 8.8, "elapsed_time": "0:27:37", "remaining_time": "4:46:23", "throughput": 2352.87, "total_tokens": 3899472} {"current_steps": 96, "total_steps": 1080, "loss": 0.5007, "lr": 4.9031542398457974e-05, "epoch": 1.7522935779816513, "percentage": 8.89, "elapsed_time": "0:28:03", "remaining_time": "4:47:37", "throughput": 2353.84, "total_tokens": 3962976} {"current_steps": 97, "total_steps": 1080, "loss": 0.3484, "lr": 4.9011395840040144e-05, "epoch": 1.7706422018348624, "percentage": 8.98, "elapsed_time": "0:28:17", "remaining_time": "4:46:41", "throughput": 2356.89, "total_tokens": 4000696} {"current_steps": 98, "total_steps": 1080, "loss": 0.2889, "lr": 4.8991046107058735e-05, "epoch": 1.7889908256880735, "percentage": 9.07, "elapsed_time": "0:28:36", "remaining_time": "4:46:38", "throughput": 2356.88, "total_tokens": 4045256} {"current_steps": 99, "total_steps": 1080, "loss": 0.2203, "lr": 4.8970493371704826e-05, "epoch": 1.8073394495412844, "percentage": 9.17, "elapsed_time": "0:28:49", "remaining_time": "4:45:39", "throughput": 2356.99, "total_tokens": 4076800} {"current_steps": 100, "total_steps": 1080, "loss": 0.3966, "lr": 4.894973780788722e-05, "epoch": 1.8256880733944953, "percentage": 9.26, "elapsed_time": "0:29:07", "remaining_time": "4:45:29", "throughput": 2356.97, "total_tokens": 4119840} {"current_steps": 101, "total_steps": 1080, "loss": 0.4417, "lr": 4.892877959123097e-05, "epoch": 1.8440366972477065, "percentage": 9.35, "elapsed_time": "0:29:27", "remaining_time": "4:45:31", "throughput": 2357.11, "total_tokens": 4165848} {"current_steps": 102, "total_steps": 1080, "loss": 0.4258, "lr": 4.890761889907589e-05, "epoch": 1.8623853211009176, "percentage": 9.44, "elapsed_time": "0:29:43", "remaining_time": "4:44:56", "throughput": 2357.05, "total_tokens": 4202824} {"current_steps": 103, "total_steps": 1080, "loss": 0.3952, "lr": 4.8886255910475054e-05, "epoch": 1.8807339449541285, "percentage": 9.54, "elapsed_time": "0:29:55", "remaining_time": "4:43:46", "throughput": 2358.63, "total_tokens": 4233888} {"current_steps": 104, "total_steps": 1080, "loss": 0.3241, "lr": 4.88646908061933e-05, "epoch": 1.8990825688073394, "percentage": 9.63, "elapsed_time": "0:30:08", "remaining_time": "4:42:56", "throughput": 2358.82, "total_tokens": 4267064} {"current_steps": 105, "total_steps": 1080, "loss": 0.4239, "lr": 4.884292376870567e-05, "epoch": 1.9174311926605505, "percentage": 9.72, "elapsed_time": "0:30:27", "remaining_time": "4:42:51", "throughput": 2359.5, "total_tokens": 4312536} {"current_steps": 106, "total_steps": 1080, "loss": 0.2579, "lr": 4.8820954982195905e-05, "epoch": 1.9357798165137616, "percentage": 9.81, "elapsed_time": "0:30:50", "remaining_time": "4:43:23", "throughput": 2354.32, "total_tokens": 4356656} {"current_steps": 107, "total_steps": 1080, "loss": 0.44, "lr": 4.879878463255483e-05, "epoch": 1.9541284403669725, "percentage": 9.91, "elapsed_time": "0:31:06", "remaining_time": "4:42:57", "throughput": 2356.87, "total_tokens": 4400216} {"current_steps": 108, "total_steps": 1080, "loss": 0.2662, "lr": 4.877641290737884e-05, "epoch": 1.9724770642201834, "percentage": 10.0, "elapsed_time": "0:31:22", "remaining_time": "4:42:20", "throughput": 2357.2, "total_tokens": 4436968} {"current_steps": 109, "total_steps": 1080, "loss": 0.4211, "lr": 4.875383999596828e-05, "epoch": 1.9908256880733946, "percentage": 10.09, "elapsed_time": "0:31:45", "remaining_time": "4:42:54", "throughput": 2355.41, "total_tokens": 4488232} {"current_steps": 110, "total_steps": 1080, "loss": 0.2499, "lr": 4.873106608932585e-05, "epoch": 2.0, "percentage": 10.19, "elapsed_time": "0:31:55", "remaining_time": "4:41:34", "throughput": 2358.23, "total_tokens": 4518176} {"current_steps": 111, "total_steps": 1080, "loss": 0.2722, "lr": 4.8708091380154984e-05, "epoch": 2.018348623853211, "percentage": 10.28, "elapsed_time": "0:32:15", "remaining_time": "4:41:40", "throughput": 2361.09, "total_tokens": 4570896} {"current_steps": 112, "total_steps": 1080, "loss": 0.2758, "lr": 4.868491606285823e-05, "epoch": 2.036697247706422, "percentage": 10.37, "elapsed_time": "0:32:36", "remaining_time": "4:41:45", "throughput": 2358.66, "total_tokens": 4613576} {"current_steps": 113, "total_steps": 1080, "loss": 0.3361, "lr": 4.866154033353561e-05, "epoch": 2.055045871559633, "percentage": 10.46, "elapsed_time": "0:32:50", "remaining_time": "4:41:04", "throughput": 2361.05, "total_tokens": 4652896} {"current_steps": 114, "total_steps": 1080, "loss": 0.2667, "lr": 4.8637964389982926e-05, "epoch": 2.073394495412844, "percentage": 10.56, "elapsed_time": "0:33:07", "remaining_time": "4:40:43", "throughput": 2361.59, "total_tokens": 4694256} {"current_steps": 115, "total_steps": 1080, "loss": 0.3628, "lr": 4.8614188431690125e-05, "epoch": 2.091743119266055, "percentage": 10.65, "elapsed_time": "0:33:31", "remaining_time": "4:41:18", "throughput": 2360.23, "total_tokens": 4747552} {"current_steps": 116, "total_steps": 1080, "loss": 0.3599, "lr": 4.859021265983959e-05, "epoch": 2.1100917431192663, "percentage": 10.74, "elapsed_time": "0:33:50", "remaining_time": "4:41:16", "throughput": 2360.76, "total_tokens": 4794080} {"current_steps": 117, "total_steps": 1080, "loss": 0.4262, "lr": 4.856603727730447e-05, "epoch": 2.128440366972477, "percentage": 10.83, "elapsed_time": "0:34:15", "remaining_time": "4:41:56", "throughput": 2358.81, "total_tokens": 4847912} {"current_steps": 118, "total_steps": 1080, "loss": 0.3118, "lr": 4.854166248864689e-05, "epoch": 2.146788990825688, "percentage": 10.93, "elapsed_time": "0:34:30", "remaining_time": "4:41:19", "throughput": 2359.58, "total_tokens": 4885480} {"current_steps": 119, "total_steps": 1080, "loss": 0.3725, "lr": 4.85170885001163e-05, "epoch": 2.165137614678899, "percentage": 11.02, "elapsed_time": "0:34:44", "remaining_time": "4:40:33", "throughput": 2360.93, "total_tokens": 4921240} {"current_steps": 120, "total_steps": 1080, "loss": 0.3816, "lr": 4.849231551964771e-05, "epoch": 2.18348623853211, "percentage": 11.11, "elapsed_time": "0:35:00", "remaining_time": "4:40:01", "throughput": 2361.85, "total_tokens": 4960224} {"current_steps": 121, "total_steps": 1080, "loss": 0.3383, "lr": 4.846734375685989e-05, "epoch": 2.2018348623853212, "percentage": 11.2, "elapsed_time": "0:35:12", "remaining_time": "4:39:00", "throughput": 2362.67, "total_tokens": 4990536} {"current_steps": 122, "total_steps": 1080, "loss": 0.3011, "lr": 4.844217342305363e-05, "epoch": 2.220183486238532, "percentage": 11.3, "elapsed_time": "0:35:37", "remaining_time": "4:39:46", "throughput": 2359.63, "total_tokens": 5044296} {"current_steps": 123, "total_steps": 1080, "loss": 0.4458, "lr": 4.8416804731209945e-05, "epoch": 2.238532110091743, "percentage": 11.39, "elapsed_time": "0:35:55", "remaining_time": "4:39:30", "throughput": 2360.74, "total_tokens": 5088368} {"current_steps": 124, "total_steps": 1080, "loss": 0.2564, "lr": 4.839123789598829e-05, "epoch": 2.2568807339449544, "percentage": 11.48, "elapsed_time": "0:36:13", "remaining_time": "4:39:15", "throughput": 2362.03, "total_tokens": 5133472} {"current_steps": 125, "total_steps": 1080, "loss": 0.313, "lr": 4.836547313372471e-05, "epoch": 2.2752293577981653, "percentage": 11.57, "elapsed_time": "0:36:27", "remaining_time": "4:38:34", "throughput": 2362.1, "total_tokens": 5167768} {"current_steps": 126, "total_steps": 1080, "loss": 0.2963, "lr": 4.8339510662430046e-05, "epoch": 2.293577981651376, "percentage": 11.67, "elapsed_time": "0:36:43", "remaining_time": "4:38:07", "throughput": 2363.66, "total_tokens": 5209400} {"current_steps": 127, "total_steps": 1080, "loss": 0.2566, "lr": 4.8313350701788054e-05, "epoch": 2.311926605504587, "percentage": 11.76, "elapsed_time": "0:36:58", "remaining_time": "4:37:26", "throughput": 2366.36, "total_tokens": 5249360} {"current_steps": 128, "total_steps": 1080, "loss": 0.2833, "lr": 4.828699347315356e-05, "epoch": 2.330275229357798, "percentage": 11.85, "elapsed_time": "0:37:19", "remaining_time": "4:37:36", "throughput": 2366.87, "total_tokens": 5300808} {"current_steps": 129, "total_steps": 1080, "loss": 0.3099, "lr": 4.826043919955062e-05, "epoch": 2.3486238532110093, "percentage": 11.94, "elapsed_time": "0:37:31", "remaining_time": "4:36:41", "throughput": 2368.15, "total_tokens": 5332960} {"current_steps": 130, "total_steps": 1080, "loss": 0.3238, "lr": 4.823368810567056e-05, "epoch": 2.36697247706422, "percentage": 12.04, "elapsed_time": "0:37:44", "remaining_time": "4:35:51", "throughput": 2368.74, "total_tokens": 5365008} {"current_steps": 131, "total_steps": 1080, "loss": 0.3153, "lr": 4.820674041787017e-05, "epoch": 2.385321100917431, "percentage": 12.13, "elapsed_time": "0:37:57", "remaining_time": "4:35:01", "throughput": 2370.65, "total_tokens": 5400184} {"current_steps": 132, "total_steps": 1080, "loss": 0.2997, "lr": 4.817959636416969e-05, "epoch": 2.4036697247706424, "percentage": 12.22, "elapsed_time": "0:38:14", "remaining_time": "4:34:37", "throughput": 2371.13, "total_tokens": 5440320} {"current_steps": 133, "total_steps": 1080, "loss": 0.2373, "lr": 4.815225617425095e-05, "epoch": 2.4220183486238533, "percentage": 12.31, "elapsed_time": "0:38:30", "remaining_time": "4:34:08", "throughput": 2372.61, "total_tokens": 5480832} {"current_steps": 134, "total_steps": 1080, "loss": 0.2456, "lr": 4.81247200794554e-05, "epoch": 2.4403669724770642, "percentage": 12.41, "elapsed_time": "0:38:48", "remaining_time": "4:34:00", "throughput": 2373.34, "total_tokens": 5526936} {"current_steps": 135, "total_steps": 1080, "loss": 0.2099, "lr": 4.8096988312782174e-05, "epoch": 2.458715596330275, "percentage": 12.5, "elapsed_time": "0:39:06", "remaining_time": "4:33:43", "throughput": 2372.47, "total_tokens": 5566384} {"current_steps": 136, "total_steps": 1080, "loss": 0.3485, "lr": 4.806906110888606e-05, "epoch": 2.477064220183486, "percentage": 12.59, "elapsed_time": "0:39:34", "remaining_time": "4:34:42", "throughput": 2370.86, "total_tokens": 5629896} {"current_steps": 137, "total_steps": 1080, "loss": 0.2231, "lr": 4.80409387040756e-05, "epoch": 2.4954128440366974, "percentage": 12.69, "elapsed_time": "0:39:50", "remaining_time": "4:34:17", "throughput": 2373.36, "total_tokens": 5674504} {"current_steps": 138, "total_steps": 1080, "loss": 0.4285, "lr": 4.8012621336311016e-05, "epoch": 2.5137614678899083, "percentage": 12.78, "elapsed_time": "0:40:06", "remaining_time": "4:33:48", "throughput": 2374.21, "total_tokens": 5714000} {"current_steps": 139, "total_steps": 1080, "loss": 0.3343, "lr": 4.798410924520223e-05, "epoch": 2.532110091743119, "percentage": 12.87, "elapsed_time": "0:40:23", "remaining_time": "4:33:28", "throughput": 2375.21, "total_tokens": 5756856} {"current_steps": 140, "total_steps": 1080, "loss": 0.2497, "lr": 4.7955402672006854e-05, "epoch": 2.5504587155963305, "percentage": 12.96, "elapsed_time": "0:40:35", "remaining_time": "4:32:31", "throughput": 2373.93, "total_tokens": 5781192} {"current_steps": 141, "total_steps": 1080, "loss": 0.2991, "lr": 4.79265018596281e-05, "epoch": 2.5688073394495414, "percentage": 13.06, "elapsed_time": "0:40:54", "remaining_time": "4:32:28", "throughput": 2372.41, "total_tokens": 5824024} {"current_steps": 142, "total_steps": 1080, "loss": 0.2406, "lr": 4.789740705261278e-05, "epoch": 2.5871559633027523, "percentage": 13.15, "elapsed_time": "0:41:11", "remaining_time": "4:32:02", "throughput": 2372.52, "total_tokens": 5862584} {"current_steps": 143, "total_steps": 1080, "loss": 0.2722, "lr": 4.786811849714918e-05, "epoch": 2.6055045871559632, "percentage": 13.24, "elapsed_time": "0:41:26", "remaining_time": "4:31:29", "throughput": 2372.2, "total_tokens": 5897344} {"current_steps": 144, "total_steps": 1080, "loss": 0.374, "lr": 4.783863644106502e-05, "epoch": 2.623853211009174, "percentage": 13.33, "elapsed_time": "0:41:41", "remaining_time": "4:31:00", "throughput": 2371.18, "total_tokens": 5931736} {"current_steps": 145, "total_steps": 1080, "loss": 0.3386, "lr": 4.780896113382536e-05, "epoch": 2.6422018348623855, "percentage": 13.43, "elapsed_time": "0:41:58", "remaining_time": "4:30:40", "throughput": 2371.54, "total_tokens": 5972784} {"current_steps": 146, "total_steps": 1080, "loss": 0.2289, "lr": 4.777909282653042e-05, "epoch": 2.6605504587155964, "percentage": 13.52, "elapsed_time": "0:42:17", "remaining_time": "4:30:33", "throughput": 2371.9, "total_tokens": 6018968} {"current_steps": 147, "total_steps": 1080, "loss": 0.4061, "lr": 4.7749031771913584e-05, "epoch": 2.6788990825688073, "percentage": 13.61, "elapsed_time": "0:42:34", "remaining_time": "4:30:16", "throughput": 2372.81, "total_tokens": 6062520} {"current_steps": 148, "total_steps": 1080, "loss": 0.2198, "lr": 4.771877822433911e-05, "epoch": 2.6972477064220186, "percentage": 13.7, "elapsed_time": "0:42:45", "remaining_time": "4:29:17", "throughput": 2372.73, "total_tokens": 6087928} {"current_steps": 149, "total_steps": 1080, "loss": 0.34, "lr": 4.7688332439800096e-05, "epoch": 2.7155963302752295, "percentage": 13.8, "elapsed_time": "0:43:05", "remaining_time": "4:29:16", "throughput": 2372.52, "total_tokens": 6134792} {"current_steps": 150, "total_steps": 1080, "loss": 0.3292, "lr": 4.765769467591625e-05, "epoch": 2.7339449541284404, "percentage": 13.89, "elapsed_time": "0:43:25", "remaining_time": "4:29:11", "throughput": 2373.48, "total_tokens": 6183296} {"current_steps": 151, "total_steps": 1080, "loss": 0.2539, "lr": 4.762686519193175e-05, "epoch": 2.7522935779816513, "percentage": 13.98, "elapsed_time": "0:43:43", "remaining_time": "4:28:57", "throughput": 2373.56, "total_tokens": 6225840} {"current_steps": 152, "total_steps": 1080, "loss": 0.3571, "lr": 4.759584424871302e-05, "epoch": 2.770642201834862, "percentage": 14.07, "elapsed_time": "0:44:05", "remaining_time": "4:29:10", "throughput": 2372.06, "total_tokens": 6274760} {"current_steps": 153, "total_steps": 1080, "loss": 0.2783, "lr": 4.756463210874652e-05, "epoch": 2.7889908256880735, "percentage": 14.17, "elapsed_time": "0:44:24", "remaining_time": "4:29:06", "throughput": 2373.83, "total_tokens": 6326168} {"current_steps": 154, "total_steps": 1080, "loss": 0.2925, "lr": 4.7533229036136553e-05, "epoch": 2.8073394495412844, "percentage": 14.26, "elapsed_time": "0:44:40", "remaining_time": "4:28:39", "throughput": 2372.58, "total_tokens": 6360312} {"current_steps": 155, "total_steps": 1080, "loss": 0.2606, "lr": 4.750163529660303e-05, "epoch": 2.8256880733944953, "percentage": 14.35, "elapsed_time": "0:44:55", "remaining_time": "4:28:05", "throughput": 2372.77, "total_tokens": 6395496} {"current_steps": 156, "total_steps": 1080, "loss": 0.3721, "lr": 4.7469851157479177e-05, "epoch": 2.8440366972477067, "percentage": 14.44, "elapsed_time": "0:45:12", "remaining_time": "4:27:44", "throughput": 2373.43, "total_tokens": 6437064} {"current_steps": 157, "total_steps": 1080, "loss": 0.3931, "lr": 4.743787688770932e-05, "epoch": 2.8623853211009176, "percentage": 14.54, "elapsed_time": "0:45:29", "remaining_time": "4:27:27", "throughput": 2373.01, "total_tokens": 6477616} {"current_steps": 158, "total_steps": 1080, "loss": 0.2201, "lr": 4.740571275784659e-05, "epoch": 2.8807339449541285, "percentage": 14.63, "elapsed_time": "0:45:47", "remaining_time": "4:27:11", "throughput": 2372.73, "total_tokens": 6518680} {"current_steps": 159, "total_steps": 1080, "loss": 0.2579, "lr": 4.737335904005063e-05, "epoch": 2.8990825688073394, "percentage": 14.72, "elapsed_time": "0:45:59", "remaining_time": "4:26:23", "throughput": 2373.58, "total_tokens": 6549768} {"current_steps": 160, "total_steps": 1080, "loss": 0.2575, "lr": 4.734081600808531e-05, "epoch": 2.9174311926605503, "percentage": 14.81, "elapsed_time": "0:46:12", "remaining_time": "4:25:44", "throughput": 2373.29, "total_tokens": 6581000} {"current_steps": 161, "total_steps": 1080, "loss": 0.2597, "lr": 4.730808393731639e-05, "epoch": 2.9357798165137616, "percentage": 14.91, "elapsed_time": "0:46:26", "remaining_time": "4:25:02", "throughput": 2373.5, "total_tokens": 6612632} {"current_steps": 162, "total_steps": 1080, "loss": 0.3335, "lr": 4.72751631047092e-05, "epoch": 2.9541284403669725, "percentage": 15.0, "elapsed_time": "0:46:42", "remaining_time": "4:24:42", "throughput": 2374.13, "total_tokens": 6654288} {"current_steps": 163, "total_steps": 1080, "loss": 0.374, "lr": 4.72420537888263e-05, "epoch": 2.9724770642201834, "percentage": 15.09, "elapsed_time": "0:47:07", "remaining_time": "4:25:07", "throughput": 2372.1, "total_tokens": 6707208} {"current_steps": 164, "total_steps": 1080, "loss": 0.3477, "lr": 4.7208756269825104e-05, "epoch": 2.9908256880733948, "percentage": 15.19, "elapsed_time": "0:47:25", "remaining_time": "4:24:54", "throughput": 2371.41, "total_tokens": 6748448} {"current_steps": 165, "total_steps": 1080, "loss": 0.3214, "lr": 4.717527082945554e-05, "epoch": 3.0, "percentage": 15.28, "elapsed_time": "0:47:37", "remaining_time": "4:24:07", "throughput": 2371.59, "total_tokens": 6777264} {"current_steps": 166, "total_steps": 1080, "loss": 0.2681, "lr": 4.714159775105765e-05, "epoch": 3.018348623853211, "percentage": 15.37, "elapsed_time": "0:47:50", "remaining_time": "4:23:23", "throughput": 2372.44, "total_tokens": 6809456} {"current_steps": 167, "total_steps": 1080, "loss": 0.2633, "lr": 4.7107737319559176e-05, "epoch": 3.036697247706422, "percentage": 15.46, "elapsed_time": "0:48:04", "remaining_time": "4:22:51", "throughput": 2372.96, "total_tokens": 6845768} {"current_steps": 168, "total_steps": 1080, "loss": 0.1961, "lr": 4.707368982147318e-05, "epoch": 3.055045871559633, "percentage": 15.56, "elapsed_time": "0:48:28", "remaining_time": "4:23:07", "throughput": 2370.17, "total_tokens": 6893056} {"current_steps": 169, "total_steps": 1080, "loss": 0.2836, "lr": 4.703945554489558e-05, "epoch": 3.073394495412844, "percentage": 15.65, "elapsed_time": "0:48:45", "remaining_time": "4:22:47", "throughput": 2370.06, "total_tokens": 6932480} {"current_steps": 170, "total_steps": 1080, "loss": 0.2838, "lr": 4.700503477950278e-05, "epoch": 3.091743119266055, "percentage": 15.74, "elapsed_time": "0:49:04", "remaining_time": "4:22:40", "throughput": 2369.4, "total_tokens": 6975992} {"current_steps": 171, "total_steps": 1080, "loss": 0.3489, "lr": 4.697042781654913e-05, "epoch": 3.1100917431192663, "percentage": 15.83, "elapsed_time": "0:49:21", "remaining_time": "4:22:24", "throughput": 2370.73, "total_tokens": 7021840} {"current_steps": 172, "total_steps": 1080, "loss": 0.3797, "lr": 4.693563494886455e-05, "epoch": 3.128440366972477, "percentage": 15.93, "elapsed_time": "0:49:39", "remaining_time": "4:22:08", "throughput": 2371.27, "total_tokens": 7065192} {"current_steps": 173, "total_steps": 1080, "loss": 0.2046, "lr": 4.6900656470851964e-05, "epoch": 3.146788990825688, "percentage": 16.02, "elapsed_time": "0:50:00", "remaining_time": "4:22:12", "throughput": 2370.87, "total_tokens": 7114544} {"current_steps": 174, "total_steps": 1080, "loss": 0.2596, "lr": 4.6865492678484895e-05, "epoch": 3.165137614678899, "percentage": 16.11, "elapsed_time": "0:50:17", "remaining_time": "4:21:53", "throughput": 2370.21, "total_tokens": 7152736} {"current_steps": 175, "total_steps": 1080, "loss": 0.3045, "lr": 4.68301438693049e-05, "epoch": 3.18348623853211, "percentage": 16.2, "elapsed_time": "0:50:41", "remaining_time": "4:22:09", "throughput": 2369.62, "total_tokens": 7207464} {"current_steps": 176, "total_steps": 1080, "loss": 0.2096, "lr": 4.679461034241906e-05, "epoch": 3.2018348623853212, "percentage": 16.3, "elapsed_time": "0:50:55", "remaining_time": "4:21:32", "throughput": 2369.3, "total_tokens": 7238640} {"current_steps": 177, "total_steps": 1080, "loss": 0.2226, "lr": 4.6758892398497494e-05, "epoch": 3.220183486238532, "percentage": 16.39, "elapsed_time": "0:51:11", "remaining_time": "4:21:11", "throughput": 2369.63, "total_tokens": 7279112} {"current_steps": 178, "total_steps": 1080, "loss": 0.2403, "lr": 4.672299033977076e-05, "epoch": 3.238532110091743, "percentage": 16.48, "elapsed_time": "0:51:25", "remaining_time": "4:20:37", "throughput": 2369.4, "total_tokens": 7311632} {"current_steps": 179, "total_steps": 1080, "loss": 0.2156, "lr": 4.6686904470027316e-05, "epoch": 3.2568807339449544, "percentage": 16.57, "elapsed_time": "0:51:38", "remaining_time": "4:19:58", "throughput": 2370.18, "total_tokens": 7344864} {"current_steps": 180, "total_steps": 1080, "loss": 0.238, "lr": 4.665063509461097e-05, "epoch": 3.2752293577981653, "percentage": 16.67, "elapsed_time": "0:51:58", "remaining_time": "4:19:50", "throughput": 2369.98, "total_tokens": 7389944} {"current_steps": 181, "total_steps": 1080, "loss": 0.2251, "lr": 4.661418252041827e-05, "epoch": 3.293577981651376, "percentage": 16.76, "elapsed_time": "0:52:12", "remaining_time": "4:19:17", "throughput": 2370.11, "total_tokens": 7423672} {"current_steps": 182, "total_steps": 1080, "loss": 0.2922, "lr": 4.657754705589591e-05, "epoch": 3.311926605504587, "percentage": 16.85, "elapsed_time": "0:52:27", "remaining_time": "4:18:50", "throughput": 2369.91, "total_tokens": 7459576} {"current_steps": 183, "total_steps": 1080, "loss": 0.2698, "lr": 4.6540729011038146e-05, "epoch": 3.330275229357798, "percentage": 16.94, "elapsed_time": "0:52:47", "remaining_time": "4:18:48", "throughput": 2371.14, "total_tokens": 7511736} {"current_steps": 184, "total_steps": 1080, "loss": 0.173, "lr": 4.650372869738414e-05, "epoch": 3.3486238532110093, "percentage": 17.04, "elapsed_time": "0:53:06", "remaining_time": "4:18:36", "throughput": 2372.11, "total_tokens": 7558552} {"current_steps": 185, "total_steps": 1080, "loss": 0.32, "lr": 4.6466546428015336e-05, "epoch": 3.36697247706422, "percentage": 17.13, "elapsed_time": "0:53:23", "remaining_time": "4:18:16", "throughput": 2372.3, "total_tokens": 7599040} {"current_steps": 186, "total_steps": 1080, "loss": 0.3058, "lr": 4.642918251755281e-05, "epoch": 3.385321100917431, "percentage": 17.22, "elapsed_time": "0:53:46", "remaining_time": "4:18:27", "throughput": 2372.06, "total_tokens": 7653264} {"current_steps": 187, "total_steps": 1080, "loss": 0.1896, "lr": 4.639163728215463e-05, "epoch": 3.4036697247706424, "percentage": 17.31, "elapsed_time": "0:54:02", "remaining_time": "4:18:06", "throughput": 2372.67, "total_tokens": 7694272} {"current_steps": 188, "total_steps": 1080, "loss": 0.2933, "lr": 4.6353911039513145e-05, "epoch": 3.4220183486238533, "percentage": 17.41, "elapsed_time": "0:54:18", "remaining_time": "4:17:38", "throughput": 2372.76, "total_tokens": 7730848} {"current_steps": 189, "total_steps": 1080, "loss": 0.2625, "lr": 4.6316004108852305e-05, "epoch": 3.4403669724770642, "percentage": 17.5, "elapsed_time": "0:54:39", "remaining_time": "4:17:39", "throughput": 2372.76, "total_tokens": 7781200} {"current_steps": 190, "total_steps": 1080, "loss": 0.3372, "lr": 4.627791681092499e-05, "epoch": 3.458715596330275, "percentage": 17.59, "elapsed_time": "0:54:56", "remaining_time": "4:17:19", "throughput": 2374.05, "total_tokens": 7825032} {"current_steps": 191, "total_steps": 1080, "loss": 0.2229, "lr": 4.623964946801027e-05, "epoch": 3.477064220183486, "percentage": 17.69, "elapsed_time": "0:55:08", "remaining_time": "4:16:40", "throughput": 2374.32, "total_tokens": 7855840} {"current_steps": 192, "total_steps": 1080, "loss": 0.3967, "lr": 4.620120240391065e-05, "epoch": 3.4954128440366974, "percentage": 17.78, "elapsed_time": "0:55:30", "remaining_time": "4:16:44", "throughput": 2373.72, "total_tokens": 7905928} {"current_steps": 193, "total_steps": 1080, "loss": 0.2254, "lr": 4.61625759439494e-05, "epoch": 3.5137614678899083, "percentage": 17.87, "elapsed_time": "0:55:53", "remaining_time": "4:16:50", "throughput": 2372.72, "total_tokens": 7955992} {"current_steps": 194, "total_steps": 1080, "loss": 0.2553, "lr": 4.612377041496776e-05, "epoch": 3.532110091743119, "percentage": 17.96, "elapsed_time": "0:56:10", "remaining_time": "4:16:33", "throughput": 2372.93, "total_tokens": 7998024} {"current_steps": 195, "total_steps": 1080, "loss": 0.2197, "lr": 4.608478614532215e-05, "epoch": 3.5504587155963305, "percentage": 18.06, "elapsed_time": "0:56:35", "remaining_time": "4:16:52", "throughput": 2372.15, "total_tokens": 8055672} {"current_steps": 196, "total_steps": 1080, "loss": 0.2507, "lr": 4.604562346488144e-05, "epoch": 3.5688073394495414, "percentage": 18.15, "elapsed_time": "0:56:51", "remaining_time": "4:16:24", "throughput": 2371.88, "total_tokens": 8090848} {"current_steps": 197, "total_steps": 1080, "loss": 0.2422, "lr": 4.6006282705024144e-05, "epoch": 3.5871559633027523, "percentage": 18.24, "elapsed_time": "0:57:09", "remaining_time": "4:16:10", "throughput": 2372.75, "total_tokens": 8136680} {"current_steps": 198, "total_steps": 1080, "loss": 0.2107, "lr": 4.5966764198635606e-05, "epoch": 3.6055045871559632, "percentage": 18.33, "elapsed_time": "0:57:32", "remaining_time": "4:16:21", "throughput": 2371.13, "total_tokens": 8187472} {"current_steps": 199, "total_steps": 1080, "loss": 0.1854, "lr": 4.592706828010518e-05, "epoch": 3.623853211009174, "percentage": 18.43, "elapsed_time": "0:57:49", "remaining_time": "4:15:57", "throughput": 2371.04, "total_tokens": 8225216} {"current_steps": 200, "total_steps": 1080, "loss": 0.1687, "lr": 4.588719528532342e-05, "epoch": 3.6422018348623855, "percentage": 18.52, "elapsed_time": "0:58:12", "remaining_time": "4:16:07", "throughput": 2369.16, "total_tokens": 8274456} {"current_steps": 201, "total_steps": 1080, "loss": 0.2549, "lr": 4.5847145551679206e-05, "epoch": 3.6605504587155964, "percentage": 18.61, "elapsed_time": "0:58:29", "remaining_time": "4:15:45", "throughput": 2370.11, "total_tokens": 8317016} {"current_steps": 202, "total_steps": 1080, "loss": 0.1602, "lr": 4.580691941805695e-05, "epoch": 3.6788990825688073, "percentage": 18.7, "elapsed_time": "0:58:47", "remaining_time": "4:15:31", "throughput": 2370.66, "total_tokens": 8361856} {"current_steps": 203, "total_steps": 1080, "loss": 0.2495, "lr": 4.5766517224833637e-05, "epoch": 3.6972477064220186, "percentage": 18.8, "elapsed_time": "0:59:05", "remaining_time": "4:15:18", "throughput": 2372.09, "total_tokens": 8410696} {"current_steps": 204, "total_steps": 1080, "loss": 0.2012, "lr": 4.572593931387604e-05, "epoch": 3.7155963302752295, "percentage": 18.89, "elapsed_time": "0:59:19", "remaining_time": "4:14:45", "throughput": 2371.56, "total_tokens": 8441872} {"current_steps": 205, "total_steps": 1080, "loss": 0.2373, "lr": 4.568518602853776e-05, "epoch": 3.7339449541284404, "percentage": 18.98, "elapsed_time": "0:59:35", "remaining_time": "4:14:21", "throughput": 2372.39, "total_tokens": 8482544} {"current_steps": 206, "total_steps": 1080, "loss": 0.233, "lr": 4.5644257713656356e-05, "epoch": 3.7522935779816513, "percentage": 19.07, "elapsed_time": "0:59:50", "remaining_time": "4:13:54", "throughput": 2372.77, "total_tokens": 8519856} {"current_steps": 207, "total_steps": 1080, "loss": 0.225, "lr": 4.5603154715550386e-05, "epoch": 3.770642201834862, "percentage": 19.17, "elapsed_time": "1:00:04", "remaining_time": "4:13:21", "throughput": 2372.49, "total_tokens": 8551392} {"current_steps": 208, "total_steps": 1080, "loss": 0.2975, "lr": 4.556187738201656e-05, "epoch": 3.7889908256880735, "percentage": 19.26, "elapsed_time": "1:00:24", "remaining_time": "4:13:13", "throughput": 2372.81, "total_tokens": 8599472} {"current_steps": 209, "total_steps": 1080, "loss": 0.2033, "lr": 4.552042606232668e-05, "epoch": 3.8073394495412844, "percentage": 19.35, "elapsed_time": "1:00:38", "remaining_time": "4:12:45", "throughput": 2372.09, "total_tokens": 8631880} {"current_steps": 210, "total_steps": 1080, "loss": 0.2024, "lr": 4.54788011072248e-05, "epoch": 3.8256880733944953, "percentage": 19.44, "elapsed_time": "1:00:57", "remaining_time": "4:12:33", "throughput": 2371.69, "total_tokens": 8675016} {"current_steps": 211, "total_steps": 1080, "loss": 0.2304, "lr": 4.5437002868924166e-05, "epoch": 3.8440366972477067, "percentage": 19.54, "elapsed_time": "1:01:13", "remaining_time": "4:12:10", "throughput": 2371.76, "total_tokens": 8713248} {"current_steps": 212, "total_steps": 1080, "loss": 0.2928, "lr": 4.539503170110431e-05, "epoch": 3.8623853211009176, "percentage": 19.63, "elapsed_time": "1:01:28", "remaining_time": "4:11:41", "throughput": 2372.06, "total_tokens": 8748800} {"current_steps": 213, "total_steps": 1080, "loss": 0.2214, "lr": 4.535288795890798e-05, "epoch": 3.8807339449541285, "percentage": 19.72, "elapsed_time": "1:01:46", "remaining_time": "4:11:25", "throughput": 2371.18, "total_tokens": 8787832} {"current_steps": 214, "total_steps": 1080, "loss": 0.2168, "lr": 4.531057199893824e-05, "epoch": 3.8990825688073394, "percentage": 19.81, "elapsed_time": "1:01:58", "remaining_time": "4:10:48", "throughput": 2371.78, "total_tokens": 8819616} {"current_steps": 215, "total_steps": 1080, "loss": 0.279, "lr": 4.526808417925531e-05, "epoch": 3.9174311926605503, "percentage": 19.91, "elapsed_time": "1:02:17", "remaining_time": "4:10:35", "throughput": 2370.99, "total_tokens": 8860744} {"current_steps": 216, "total_steps": 1080, "loss": 0.2597, "lr": 4.522542485937369e-05, "epoch": 3.9357798165137616, "percentage": 20.0, "elapsed_time": "1:02:35", "remaining_time": "4:10:23", "throughput": 2371.4, "total_tokens": 8906432} {"current_steps": 217, "total_steps": 1080, "loss": 0.241, "lr": 4.5182594400259e-05, "epoch": 3.9541284403669725, "percentage": 20.09, "elapsed_time": "1:02:57", "remaining_time": "4:10:23", "throughput": 2370.51, "total_tokens": 8955104} {"current_steps": 218, "total_steps": 1080, "loss": 0.2157, "lr": 4.5139593164324986e-05, "epoch": 3.9724770642201834, "percentage": 20.19, "elapsed_time": "1:03:12", "remaining_time": "4:09:56", "throughput": 2370.42, "total_tokens": 8990200} {"current_steps": 219, "total_steps": 1080, "loss": 0.2046, "lr": 4.509642151543043e-05, "epoch": 3.9908256880733948, "percentage": 20.28, "elapsed_time": "1:03:25", "remaining_time": "4:09:20", "throughput": 2370.56, "total_tokens": 9020760} {"current_steps": 220, "total_steps": 1080, "loss": 0.1714, "lr": 4.50530798188761e-05, "epoch": 4.0, "percentage": 20.37, "elapsed_time": "1:03:31", "remaining_time": "4:08:20", "throughput": 2370.68, "total_tokens": 9036352} {"current_steps": 221, "total_steps": 1080, "loss": 0.1811, "lr": 4.50095684414016e-05, "epoch": 4.018348623853211, "percentage": 20.46, "elapsed_time": "1:03:56", "remaining_time": "4:08:33", "throughput": 2369.61, "total_tokens": 9091776} {"current_steps": 222, "total_steps": 1080, "loss": 0.2101, "lr": 4.496588775118232e-05, "epoch": 4.036697247706422, "percentage": 20.56, "elapsed_time": "1:04:13", "remaining_time": "4:08:14", "throughput": 2370.09, "total_tokens": 9134080} {"current_steps": 223, "total_steps": 1080, "loss": 0.1444, "lr": 4.4922038117826334e-05, "epoch": 4.055045871559633, "percentage": 20.65, "elapsed_time": "1:04:31", "remaining_time": "4:07:56", "throughput": 2369.54, "total_tokens": 9172720} {"current_steps": 224, "total_steps": 1080, "loss": 0.2342, "lr": 4.48780199123712e-05, "epoch": 4.073394495412844, "percentage": 20.74, "elapsed_time": "1:04:48", "remaining_time": "4:07:39", "throughput": 2369.52, "total_tokens": 9213664} {"current_steps": 225, "total_steps": 1080, "loss": 0.1676, "lr": 4.4833833507280884e-05, "epoch": 4.091743119266055, "percentage": 20.83, "elapsed_time": "1:05:11", "remaining_time": "4:07:45", "throughput": 2367.53, "total_tokens": 9261768} {"current_steps": 226, "total_steps": 1080, "loss": 0.295, "lr": 4.478947927644258e-05, "epoch": 4.110091743119266, "percentage": 20.93, "elapsed_time": "1:05:27", "remaining_time": "4:07:19", "throughput": 2368.44, "total_tokens": 9300928} {"current_steps": 227, "total_steps": 1080, "loss": 0.17, "lr": 4.474495759516358e-05, "epoch": 4.128440366972477, "percentage": 21.02, "elapsed_time": "1:05:38", "remaining_time": "4:06:39", "throughput": 2368.81, "total_tokens": 9329472} {"current_steps": 228, "total_steps": 1080, "loss": 0.1759, "lr": 4.4700268840168045e-05, "epoch": 4.146788990825688, "percentage": 21.11, "elapsed_time": "1:05:54", "remaining_time": "4:06:17", "throughput": 2368.35, "total_tokens": 9365640} {"current_steps": 229, "total_steps": 1080, "loss": 0.1878, "lr": 4.4655413389593856e-05, "epoch": 4.165137614678899, "percentage": 21.2, "elapsed_time": "1:06:15", "remaining_time": "4:06:12", "throughput": 2367.29, "total_tokens": 9410552} {"current_steps": 230, "total_steps": 1080, "loss": 0.1637, "lr": 4.4610391622989396e-05, "epoch": 4.18348623853211, "percentage": 21.3, "elapsed_time": "1:06:32", "remaining_time": "4:05:55", "throughput": 2367.48, "total_tokens": 9452416} {"current_steps": 231, "total_steps": 1080, "loss": 0.2748, "lr": 4.456520392131035e-05, "epoch": 4.201834862385321, "percentage": 21.39, "elapsed_time": "1:06:54", "remaining_time": "4:05:53", "throughput": 2367.55, "total_tokens": 9503528} {"current_steps": 232, "total_steps": 1080, "loss": 0.2635, "lr": 4.4519850666916484e-05, "epoch": 4.220183486238533, "percentage": 21.48, "elapsed_time": "1:07:10", "remaining_time": "4:05:32", "throughput": 2367.22, "total_tokens": 9541592} {"current_steps": 233, "total_steps": 1080, "loss": 0.2027, "lr": 4.447433224356839e-05, "epoch": 4.238532110091743, "percentage": 21.57, "elapsed_time": "1:07:29", "remaining_time": "4:05:20", "throughput": 2367.29, "total_tokens": 9586064} {"current_steps": 234, "total_steps": 1080, "loss": 0.2107, "lr": 4.442864903642428e-05, "epoch": 4.256880733944954, "percentage": 21.67, "elapsed_time": "1:07:54", "remaining_time": "4:05:30", "throughput": 2366.36, "total_tokens": 9641688} {"current_steps": 235, "total_steps": 1080, "loss": 0.2879, "lr": 4.438280143203665e-05, "epoch": 4.275229357798165, "percentage": 21.76, "elapsed_time": "1:08:12", "remaining_time": "4:05:15", "throughput": 2366.88, "total_tokens": 9686240} {"current_steps": 236, "total_steps": 1080, "loss": 0.2594, "lr": 4.43367898183491e-05, "epoch": 4.293577981651376, "percentage": 21.85, "elapsed_time": "1:08:33", "remaining_time": "4:05:11", "throughput": 2366.71, "total_tokens": 9735632} {"current_steps": 237, "total_steps": 1080, "loss": 0.1907, "lr": 4.4290614584693004e-05, "epoch": 4.3119266055045875, "percentage": 21.94, "elapsed_time": "1:08:46", "remaining_time": "4:04:39", "throughput": 2366.57, "total_tokens": 9766536} {"current_steps": 238, "total_steps": 1080, "loss": 0.1805, "lr": 4.4244276121784195e-05, "epoch": 4.330275229357798, "percentage": 22.04, "elapsed_time": "1:09:00", "remaining_time": "4:04:06", "throughput": 2366.28, "total_tokens": 9796400} {"current_steps": 239, "total_steps": 1080, "loss": 0.1824, "lr": 4.4197774821719714e-05, "epoch": 4.348623853211009, "percentage": 22.13, "elapsed_time": "1:09:15", "remaining_time": "4:03:43", "throughput": 2365.86, "total_tokens": 9831992} {"current_steps": 240, "total_steps": 1080, "loss": 0.1721, "lr": 4.415111107797445e-05, "epoch": 4.36697247706422, "percentage": 22.22, "elapsed_time": "1:09:32", "remaining_time": "4:03:25", "throughput": 2366.57, "total_tokens": 9875640} {"current_steps": 241, "total_steps": 1080, "loss": 0.275, "lr": 4.410428528539783e-05, "epoch": 4.385321100917431, "percentage": 22.31, "elapsed_time": "1:09:50", "remaining_time": "4:03:08", "throughput": 2366.48, "total_tokens": 9916816} {"current_steps": 242, "total_steps": 1080, "loss": 0.1963, "lr": 4.405729784021046e-05, "epoch": 4.4036697247706424, "percentage": 22.41, "elapsed_time": "1:10:09", "remaining_time": "4:02:58", "throughput": 2366.55, "total_tokens": 9962928} {"current_steps": 243, "total_steps": 1080, "loss": 0.1626, "lr": 4.401014914000078e-05, "epoch": 4.422018348623853, "percentage": 22.5, "elapsed_time": "1:10:24", "remaining_time": "4:02:29", "throughput": 2366.72, "total_tokens": 9997224} {"current_steps": 244, "total_steps": 1080, "loss": 0.1733, "lr": 4.396283958372173e-05, "epoch": 4.440366972477064, "percentage": 22.59, "elapsed_time": "1:10:41", "remaining_time": "4:02:13", "throughput": 2365.98, "total_tokens": 10036248} {"current_steps": 245, "total_steps": 1080, "loss": 0.1936, "lr": 4.391536957168733e-05, "epoch": 4.458715596330276, "percentage": 22.69, "elapsed_time": "1:10:56", "remaining_time": "4:01:48", "throughput": 2365.64, "total_tokens": 10070312} {"current_steps": 246, "total_steps": 1080, "loss": 0.1847, "lr": 4.386773950556931e-05, "epoch": 4.477064220183486, "percentage": 22.78, "elapsed_time": "1:11:15", "remaining_time": "4:01:35", "throughput": 2365.69, "total_tokens": 10114568} {"current_steps": 247, "total_steps": 1080, "loss": 0.1981, "lr": 4.381994978839371e-05, "epoch": 4.495412844036697, "percentage": 22.87, "elapsed_time": "1:11:30", "remaining_time": "4:01:08", "throughput": 2365.95, "total_tokens": 10150280} {"current_steps": 248, "total_steps": 1080, "loss": 0.1681, "lr": 4.377200082453749e-05, "epoch": 4.513761467889909, "percentage": 22.96, "elapsed_time": "1:11:48", "remaining_time": "4:00:54", "throughput": 2366.05, "total_tokens": 10194000} {"current_steps": 249, "total_steps": 1080, "loss": 0.2111, "lr": 4.372389301972506e-05, "epoch": 4.532110091743119, "percentage": 23.06, "elapsed_time": "1:12:04", "remaining_time": "4:00:30", "throughput": 2366.38, "total_tokens": 10232264} {"current_steps": 250, "total_steps": 1080, "loss": 0.2307, "lr": 4.36756267810249e-05, "epoch": 4.5504587155963305, "percentage": 23.15, "elapsed_time": "1:12:19", "remaining_time": "4:00:06", "throughput": 2367.1, "total_tokens": 10271880} {"current_steps": 251, "total_steps": 1080, "loss": 0.1609, "lr": 4.36272025168461e-05, "epoch": 4.568807339449541, "percentage": 23.24, "elapsed_time": "1:12:38", "remaining_time": "3:59:55", "throughput": 2367.17, "total_tokens": 10317720} {"current_steps": 252, "total_steps": 1080, "loss": 0.2456, "lr": 4.357862063693486e-05, "epoch": 4.587155963302752, "percentage": 23.33, "elapsed_time": "1:12:57", "remaining_time": "3:59:42", "throughput": 2367.29, "total_tokens": 10362168} {"current_steps": 253, "total_steps": 1080, "loss": 0.3159, "lr": 4.3529881552371096e-05, "epoch": 4.605504587155964, "percentage": 23.43, "elapsed_time": "1:13:21", "remaining_time": "3:59:48", "throughput": 2365.92, "total_tokens": 10414312} {"current_steps": 254, "total_steps": 1080, "loss": 0.2194, "lr": 4.34809856755649e-05, "epoch": 4.623853211009174, "percentage": 23.52, "elapsed_time": "1:13:38", "remaining_time": "3:59:28", "throughput": 2365.58, "total_tokens": 10451800} {"current_steps": 255, "total_steps": 1080, "loss": 0.1846, "lr": 4.34319334202531e-05, "epoch": 4.6422018348623855, "percentage": 23.61, "elapsed_time": "1:13:56", "remaining_time": "3:59:12", "throughput": 2366.07, "total_tokens": 10496224} {"current_steps": 256, "total_steps": 1080, "loss": 0.1906, "lr": 4.3382725201495723e-05, "epoch": 4.660550458715596, "percentage": 23.7, "elapsed_time": "1:14:11", "remaining_time": "3:58:47", "throughput": 2366.98, "total_tokens": 10536392} {"current_steps": 257, "total_steps": 1080, "loss": 0.1793, "lr": 4.333336143567247e-05, "epoch": 4.678899082568807, "percentage": 23.8, "elapsed_time": "1:14:28", "remaining_time": "3:58:31", "throughput": 2366.89, "total_tokens": 10577640} {"current_steps": 258, "total_steps": 1080, "loss": 0.1576, "lr": 4.3283842540479264e-05, "epoch": 4.697247706422019, "percentage": 23.89, "elapsed_time": "1:14:44", "remaining_time": "3:58:07", "throughput": 2366.65, "total_tokens": 10613376} {"current_steps": 259, "total_steps": 1080, "loss": 0.1447, "lr": 4.3234168934924636e-05, "epoch": 4.715596330275229, "percentage": 23.98, "elapsed_time": "1:14:58", "remaining_time": "3:57:40", "throughput": 2366.66, "total_tokens": 10647232} {"current_steps": 260, "total_steps": 1080, "loss": 0.1488, "lr": 4.318434103932622e-05, "epoch": 4.73394495412844, "percentage": 24.07, "elapsed_time": "1:15:20", "remaining_time": "3:57:35", "throughput": 2366.28, "total_tokens": 10696024} {"current_steps": 261, "total_steps": 1080, "loss": 0.1597, "lr": 4.313435927530719e-05, "epoch": 4.752293577981652, "percentage": 24.17, "elapsed_time": "1:15:35", "remaining_time": "3:57:11", "throughput": 2365.93, "total_tokens": 10730408} {"current_steps": 262, "total_steps": 1080, "loss": 0.2266, "lr": 4.30842240657927e-05, "epoch": 4.770642201834862, "percentage": 24.26, "elapsed_time": "1:15:50", "remaining_time": "3:56:46", "throughput": 2365.68, "total_tokens": 10764776} {"current_steps": 263, "total_steps": 1080, "loss": 0.1562, "lr": 4.303393583500628e-05, "epoch": 4.7889908256880735, "percentage": 24.35, "elapsed_time": "1:16:01", "remaining_time": "3:56:09", "throughput": 2366.01, "total_tokens": 10792272} {"current_steps": 264, "total_steps": 1080, "loss": 0.1504, "lr": 4.2983495008466276e-05, "epoch": 4.807339449541285, "percentage": 24.44, "elapsed_time": "1:16:15", "remaining_time": "3:55:42", "throughput": 2365.86, "total_tokens": 10825240} {"current_steps": 265, "total_steps": 1080, "loss": 0.1648, "lr": 4.293290201298223e-05, "epoch": 4.825688073394495, "percentage": 24.54, "elapsed_time": "1:16:41", "remaining_time": "3:55:52", "throughput": 2365.1, "total_tokens": 10883592} {"current_steps": 266, "total_steps": 1080, "loss": 0.1652, "lr": 4.288215727665129e-05, "epoch": 4.844036697247707, "percentage": 24.63, "elapsed_time": "1:16:57", "remaining_time": "3:55:28", "throughput": 2365.73, "total_tokens": 10922640} {"current_steps": 267, "total_steps": 1080, "loss": 0.1817, "lr": 4.2831261228854544e-05, "epoch": 4.862385321100917, "percentage": 24.72, "elapsed_time": "1:17:14", "remaining_time": "3:55:11", "throughput": 2366.42, "total_tokens": 10967288} {"current_steps": 268, "total_steps": 1080, "loss": 0.2066, "lr": 4.278021430025343e-05, "epoch": 4.8807339449541285, "percentage": 24.81, "elapsed_time": "1:17:34", "remaining_time": "3:55:01", "throughput": 2365.82, "total_tokens": 11011152} {"current_steps": 269, "total_steps": 1080, "loss": 0.1522, "lr": 4.272901692278609e-05, "epoch": 4.89908256880734, "percentage": 24.91, "elapsed_time": "1:17:53", "remaining_time": "3:54:49", "throughput": 2365.6, "total_tokens": 11055608} {"current_steps": 270, "total_steps": 1080, "loss": 0.2201, "lr": 4.267766952966369e-05, "epoch": 4.91743119266055, "percentage": 25.0, "elapsed_time": "1:18:13", "remaining_time": "3:54:41", "throughput": 2365.18, "total_tokens": 11101992} {"current_steps": 271, "total_steps": 1080, "loss": 0.2777, "lr": 4.262617255536676e-05, "epoch": 4.935779816513762, "percentage": 25.09, "elapsed_time": "1:18:32", "remaining_time": "3:54:27", "throughput": 2364.32, "total_tokens": 11141408} {"current_steps": 272, "total_steps": 1080, "loss": 0.1857, "lr": 4.257452643564155e-05, "epoch": 4.954128440366972, "percentage": 25.19, "elapsed_time": "1:18:51", "remaining_time": "3:54:14", "throughput": 2364.19, "total_tokens": 11185344} {"current_steps": 273, "total_steps": 1080, "loss": 0.1653, "lr": 4.2522731607496275e-05, "epoch": 4.972477064220183, "percentage": 25.28, "elapsed_time": "1:19:04", "remaining_time": "3:53:43", "throughput": 2364.27, "total_tokens": 11216160} {"current_steps": 274, "total_steps": 1080, "loss": 0.1761, "lr": 4.24707885091975e-05, "epoch": 4.990825688073395, "percentage": 25.37, "elapsed_time": "1:19:31", "remaining_time": "3:53:57", "throughput": 2363.04, "total_tokens": 11276200} {"current_steps": 275, "total_steps": 1080, "loss": 0.1582, "lr": 4.241869758026638e-05, "epoch": 5.0, "percentage": 25.46, "elapsed_time": "1:19:39", "remaining_time": "3:53:12", "throughput": 2363.12, "total_tokens": 11295440} {"current_steps": 276, "total_steps": 1080, "loss": 0.1538, "lr": 4.2366459261474933e-05, "epoch": 5.018348623853211, "percentage": 25.56, "elapsed_time": "1:19:57", "remaining_time": "3:52:55", "throughput": 2362.97, "total_tokens": 11336400} {"current_steps": 277, "total_steps": 1080, "loss": 0.1319, "lr": 4.231407399484236e-05, "epoch": 5.036697247706422, "percentage": 25.65, "elapsed_time": "1:20:14", "remaining_time": "3:52:36", "throughput": 2362.59, "total_tokens": 11374056} {"current_steps": 278, "total_steps": 1080, "loss": 0.174, "lr": 4.226154222363124e-05, "epoch": 5.055045871559633, "percentage": 25.74, "elapsed_time": "1:20:32", "remaining_time": "3:52:22", "throughput": 2361.95, "total_tokens": 11414776} {"current_steps": 279, "total_steps": 1080, "loss": 0.1831, "lr": 4.220886439234385e-05, "epoch": 5.073394495412844, "percentage": 25.83, "elapsed_time": "1:20:53", "remaining_time": "3:52:15", "throughput": 2362.15, "total_tokens": 11465456} {"current_steps": 280, "total_steps": 1080, "loss": 0.1515, "lr": 4.215604094671835e-05, "epoch": 5.091743119266055, "percentage": 25.93, "elapsed_time": "1:21:07", "remaining_time": "3:51:46", "throughput": 2362.75, "total_tokens": 11500184} {"current_steps": 281, "total_steps": 1080, "loss": 0.1295, "lr": 4.2103072333725e-05, "epoch": 5.110091743119266, "percentage": 26.02, "elapsed_time": "1:21:20", "remaining_time": "3:51:18", "throughput": 2363.7, "total_tokens": 11537112} {"current_steps": 282, "total_steps": 1080, "loss": 0.1339, "lr": 4.2049959001562464e-05, "epoch": 5.128440366972477, "percentage": 26.11, "elapsed_time": "1:21:39", "remaining_time": "3:51:05", "throughput": 2363.2, "total_tokens": 11579440} {"current_steps": 283, "total_steps": 1080, "loss": 0.1909, "lr": 4.199670139965393e-05, "epoch": 5.146788990825688, "percentage": 26.2, "elapsed_time": "1:22:08", "remaining_time": "3:51:21", "throughput": 2362.2, "total_tokens": 11643272} {"current_steps": 284, "total_steps": 1080, "loss": 0.2334, "lr": 4.194329997864331e-05, "epoch": 5.165137614678899, "percentage": 26.3, "elapsed_time": "1:22:23", "remaining_time": "3:50:54", "throughput": 2362.34, "total_tokens": 11677528} {"current_steps": 285, "total_steps": 1080, "loss": 0.1406, "lr": 4.188975519039151e-05, "epoch": 5.18348623853211, "percentage": 26.39, "elapsed_time": "1:22:43", "remaining_time": "3:50:45", "throughput": 2362.77, "total_tokens": 11727944} {"current_steps": 286, "total_steps": 1080, "loss": 0.138, "lr": 4.183606748797251e-05, "epoch": 5.201834862385321, "percentage": 26.48, "elapsed_time": "1:23:07", "remaining_time": "3:50:47", "throughput": 2361.69, "total_tokens": 11779568} {"current_steps": 287, "total_steps": 1080, "loss": 0.159, "lr": 4.1782237325669595e-05, "epoch": 5.220183486238533, "percentage": 26.57, "elapsed_time": "1:23:25", "remaining_time": "3:50:29", "throughput": 2362.42, "total_tokens": 11824600} {"current_steps": 288, "total_steps": 1080, "loss": 0.2517, "lr": 4.172826515897146e-05, "epoch": 5.238532110091743, "percentage": 26.67, "elapsed_time": "1:23:45", "remaining_time": "3:50:19", "throughput": 2362.76, "total_tokens": 11873736} {"current_steps": 289, "total_steps": 1080, "loss": 0.1349, "lr": 4.167415144456841e-05, "epoch": 5.256880733944954, "percentage": 26.76, "elapsed_time": "1:24:00", "remaining_time": "3:49:55", "throughput": 2362.83, "total_tokens": 11909608} {"current_steps": 290, "total_steps": 1080, "loss": 0.1348, "lr": 4.1619896640348445e-05, "epoch": 5.275229357798165, "percentage": 26.85, "elapsed_time": "1:24:15", "remaining_time": "3:49:30", "throughput": 2363.03, "total_tokens": 11945440} {"current_steps": 291, "total_steps": 1080, "loss": 0.1331, "lr": 4.1565501205393445e-05, "epoch": 5.293577981651376, "percentage": 26.94, "elapsed_time": "1:24:32", "remaining_time": "3:49:12", "throughput": 2363.02, "total_tokens": 11985568} {"current_steps": 292, "total_steps": 1080, "loss": 0.2337, "lr": 4.1510965599975196e-05, "epoch": 5.3119266055045875, "percentage": 27.04, "elapsed_time": "1:24:51", "remaining_time": "3:49:00", "throughput": 2363.5, "total_tokens": 12034320} {"current_steps": 293, "total_steps": 1080, "loss": 0.1299, "lr": 4.1456290285551596e-05, "epoch": 5.330275229357798, "percentage": 27.13, "elapsed_time": "1:25:06", "remaining_time": "3:48:35", "throughput": 2363.71, "total_tokens": 12070184} {"current_steps": 294, "total_steps": 1080, "loss": 0.1239, "lr": 4.140147572476268e-05, "epoch": 5.348623853211009, "percentage": 27.22, "elapsed_time": "1:25:22", "remaining_time": "3:48:15", "throughput": 2364.24, "total_tokens": 12111512} {"current_steps": 295, "total_steps": 1080, "loss": 0.133, "lr": 4.1346522381426744e-05, "epoch": 5.36697247706422, "percentage": 27.31, "elapsed_time": "1:25:43", "remaining_time": "3:48:07", "throughput": 2363.35, "total_tokens": 12156792} {"current_steps": 296, "total_steps": 1080, "loss": 0.1301, "lr": 4.129143072053638e-05, "epoch": 5.385321100917431, "percentage": 27.41, "elapsed_time": "1:25:55", "remaining_time": "3:47:34", "throughput": 2363.69, "total_tokens": 12185168} {"current_steps": 297, "total_steps": 1080, "loss": 0.1298, "lr": 4.123620120825459e-05, "epoch": 5.4036697247706424, "percentage": 27.5, "elapsed_time": "1:26:10", "remaining_time": "3:47:10", "throughput": 2363.92, "total_tokens": 12222256} {"current_steps": 298, "total_steps": 1080, "loss": 0.2088, "lr": 4.118083431191081e-05, "epoch": 5.422018348623853, "percentage": 27.59, "elapsed_time": "1:26:25", "remaining_time": "3:46:48", "throughput": 2363.6, "total_tokens": 12257536} {"current_steps": 299, "total_steps": 1080, "loss": 0.1062, "lr": 4.112533049999696e-05, "epoch": 5.440366972477064, "percentage": 27.69, "elapsed_time": "1:26:39", "remaining_time": "3:46:20", "throughput": 2363.97, "total_tokens": 12290576} {"current_steps": 300, "total_steps": 1080, "loss": 0.1989, "lr": 4.1069690242163484e-05, "epoch": 5.458715596330276, "percentage": 27.78, "elapsed_time": "1:26:54", "remaining_time": "3:45:56", "throughput": 2363.43, "total_tokens": 12323416} {"current_steps": 301, "total_steps": 1080, "loss": 0.1243, "lr": 4.101391400921538e-05, "epoch": 5.477064220183486, "percentage": 27.87, "elapsed_time": "1:27:14", "remaining_time": "3:45:46", "throughput": 2363.3, "total_tokens": 12370264} {"current_steps": 302, "total_steps": 1080, "loss": 0.2281, "lr": 4.095800227310821e-05, "epoch": 5.495412844036697, "percentage": 27.96, "elapsed_time": "1:27:32", "remaining_time": "3:45:30", "throughput": 2363.0, "total_tokens": 12410568} {"current_steps": 303, "total_steps": 1080, "loss": 0.1462, "lr": 4.09019555069441e-05, "epoch": 5.513761467889909, "percentage": 28.06, "elapsed_time": "1:27:45", "remaining_time": "3:45:03", "throughput": 2362.87, "total_tokens": 12442880} {"current_steps": 304, "total_steps": 1080, "loss": 0.1497, "lr": 4.0845774184967754e-05, "epoch": 5.532110091743119, "percentage": 28.15, "elapsed_time": "1:28:05", "remaining_time": "3:44:51", "throughput": 2362.53, "total_tokens": 12487016} {"current_steps": 305, "total_steps": 1080, "loss": 0.2082, "lr": 4.078945878256244e-05, "epoch": 5.5504587155963305, "percentage": 28.24, "elapsed_time": "1:28:22", "remaining_time": "3:44:33", "throughput": 2362.18, "total_tokens": 12525072} {"current_steps": 306, "total_steps": 1080, "loss": 0.1214, "lr": 4.073300977624594e-05, "epoch": 5.568807339449541, "percentage": 28.33, "elapsed_time": "1:28:35", "remaining_time": "3:44:04", "throughput": 2362.2, "total_tokens": 12555792} {"current_steps": 307, "total_steps": 1080, "loss": 0.1278, "lr": 4.067642764366654e-05, "epoch": 5.587155963302752, "percentage": 28.43, "elapsed_time": "1:28:54", "remaining_time": "3:43:52", "throughput": 2362.14, "total_tokens": 12601616} {"current_steps": 308, "total_steps": 1080, "loss": 0.1485, "lr": 4.0619712863599e-05, "epoch": 5.605504587155964, "percentage": 28.52, "elapsed_time": "1:29:09", "remaining_time": "3:43:27", "throughput": 2362.0, "total_tokens": 12634360} {"current_steps": 309, "total_steps": 1080, "loss": 0.1221, "lr": 4.0562865915940496e-05, "epoch": 5.623853211009174, "percentage": 28.61, "elapsed_time": "1:29:25", "remaining_time": "3:43:08", "throughput": 2362.18, "total_tokens": 12674808} {"current_steps": 310, "total_steps": 1080, "loss": 0.1388, "lr": 4.05058872817065e-05, "epoch": 5.6422018348623855, "percentage": 28.7, "elapsed_time": "1:29:41", "remaining_time": "3:42:47", "throughput": 2361.8, "total_tokens": 12710864} {"current_steps": 311, "total_steps": 1080, "loss": 0.1349, "lr": 4.044877744302683e-05, "epoch": 5.660550458715596, "percentage": 28.8, "elapsed_time": "1:29:57", "remaining_time": "3:42:27", "throughput": 2362.21, "total_tokens": 12750920} {"current_steps": 312, "total_steps": 1080, "loss": 0.1555, "lr": 4.039153688314145e-05, "epoch": 5.678899082568807, "percentage": 28.89, "elapsed_time": "1:30:16", "remaining_time": "3:42:12", "throughput": 2361.34, "total_tokens": 12789488} {"current_steps": 313, "total_steps": 1080, "loss": 0.1063, "lr": 4.0334166086396484e-05, "epoch": 5.697247706422019, "percentage": 28.98, "elapsed_time": "1:30:34", "remaining_time": "3:41:57", "throughput": 2361.11, "total_tokens": 12831408} {"current_steps": 314, "total_steps": 1080, "loss": 0.127, "lr": 4.0276665538239996e-05, "epoch": 5.715596330275229, "percentage": 29.07, "elapsed_time": "1:30:50", "remaining_time": "3:41:36", "throughput": 2361.64, "total_tokens": 12872584} {"current_steps": 315, "total_steps": 1080, "loss": 0.1428, "lr": 4.021903572521802e-05, "epoch": 5.73394495412844, "percentage": 29.17, "elapsed_time": "1:31:05", "remaining_time": "3:41:12", "throughput": 2362.32, "total_tokens": 12910528} {"current_steps": 316, "total_steps": 1080, "loss": 0.1279, "lr": 4.0161277134970345e-05, "epoch": 5.752293577981652, "percentage": 29.26, "elapsed_time": "1:31:18", "remaining_time": "3:40:45", "throughput": 2362.54, "total_tokens": 12942800} {"current_steps": 317, "total_steps": 1080, "loss": 0.1459, "lr": 4.010339025622641e-05, "epoch": 5.770642201834862, "percentage": 29.35, "elapsed_time": "1:31:34", "remaining_time": "3:40:25", "throughput": 2363.86, "total_tokens": 12989136} {"current_steps": 318, "total_steps": 1080, "loss": 0.1429, "lr": 4.0045375578801214e-05, "epoch": 5.7889908256880735, "percentage": 29.44, "elapsed_time": "1:31:52", "remaining_time": "3:40:09", "throughput": 2364.63, "total_tokens": 13035472} {"current_steps": 319, "total_steps": 1080, "loss": 0.1257, "lr": 3.99872335935911e-05, "epoch": 5.807339449541285, "percentage": 29.54, "elapsed_time": "1:32:11", "remaining_time": "3:39:55", "throughput": 2363.82, "total_tokens": 13074952} {"current_steps": 320, "total_steps": 1080, "loss": 0.1807, "lr": 3.9928964792569655e-05, "epoch": 5.825688073394495, "percentage": 29.63, "elapsed_time": "1:32:33", "remaining_time": "3:39:48", "throughput": 2363.44, "total_tokens": 13124624} {"current_steps": 321, "total_steps": 1080, "loss": 0.1853, "lr": 3.9870569668783536e-05, "epoch": 5.844036697247707, "percentage": 29.72, "elapsed_time": "1:32:54", "remaining_time": "3:39:39", "throughput": 2363.02, "total_tokens": 13171464} {"current_steps": 322, "total_steps": 1080, "loss": 0.214, "lr": 3.981204871634827e-05, "epoch": 5.862385321100917, "percentage": 29.81, "elapsed_time": "1:33:14", "remaining_time": "3:39:30", "throughput": 2363.86, "total_tokens": 13225240} {"current_steps": 323, "total_steps": 1080, "loss": 0.1907, "lr": 3.9753402430444116e-05, "epoch": 5.8807339449541285, "percentage": 29.91, "elapsed_time": "1:33:36", "remaining_time": "3:39:23", "throughput": 2363.68, "total_tokens": 13275848} {"current_steps": 324, "total_steps": 1080, "loss": 0.27, "lr": 3.969463130731183e-05, "epoch": 5.89908256880734, "percentage": 30.0, "elapsed_time": "1:33:50", "remaining_time": "3:38:58", "throughput": 2364.04, "total_tokens": 13311096} {"current_steps": 325, "total_steps": 1080, "loss": 0.1775, "lr": 3.963573584424852e-05, "epoch": 5.91743119266055, "percentage": 30.09, "elapsed_time": "1:34:16", "remaining_time": "3:39:00", "throughput": 2364.55, "total_tokens": 13375064} {"current_steps": 326, "total_steps": 1080, "loss": 0.1206, "lr": 3.957671653960337e-05, "epoch": 5.935779816513762, "percentage": 30.19, "elapsed_time": "1:34:38", "remaining_time": "3:38:53", "throughput": 2364.66, "total_tokens": 13427072} {"current_steps": 327, "total_steps": 1080, "loss": 0.1232, "lr": 3.9517573892773494e-05, "epoch": 5.954128440366972, "percentage": 30.28, "elapsed_time": "1:34:49", "remaining_time": "3:38:21", "throughput": 2364.74, "total_tokens": 13454088} {"current_steps": 328, "total_steps": 1080, "loss": 0.1696, "lr": 3.945830840419966e-05, "epoch": 5.972477064220183, "percentage": 30.37, "elapsed_time": "1:35:02", "remaining_time": "3:37:54", "throughput": 2364.94, "total_tokens": 13486504} {"current_steps": 329, "total_steps": 1080, "loss": 0.1055, "lr": 3.9398920575362086e-05, "epoch": 5.990825688073395, "percentage": 30.46, "elapsed_time": "1:35:17", "remaining_time": "3:37:30", "throughput": 2365.45, "total_tokens": 13523736} {"current_steps": 330, "total_steps": 1080, "loss": 0.2192, "lr": 3.933941090877615e-05, "epoch": 6.0, "percentage": 30.56, "elapsed_time": "1:35:32", "remaining_time": "3:37:08", "throughput": 2364.44, "total_tokens": 13554528} {"current_steps": 331, "total_steps": 1080, "loss": 0.1318, "lr": 3.9279779907988215e-05, "epoch": 6.018348623853211, "percentage": 30.65, "elapsed_time": "1:35:46", "remaining_time": "3:36:42", "throughput": 2364.62, "total_tokens": 13587424} {"current_steps": 332, "total_steps": 1080, "loss": 0.1136, "lr": 3.9220028077571295e-05, "epoch": 6.036697247706422, "percentage": 30.74, "elapsed_time": "1:36:00", "remaining_time": "3:36:18", "throughput": 2365.21, "total_tokens": 13624376} {"current_steps": 333, "total_steps": 1080, "loss": 0.0891, "lr": 3.916015592312082e-05, "epoch": 6.055045871559633, "percentage": 30.83, "elapsed_time": "1:36:12", "remaining_time": "3:35:48", "throughput": 2365.26, "total_tokens": 13652848} {"current_steps": 334, "total_steps": 1080, "loss": 0.1477, "lr": 3.910016395125037e-05, "epoch": 6.073394495412844, "percentage": 30.93, "elapsed_time": "1:36:45", "remaining_time": "3:36:06", "throughput": 2363.23, "total_tokens": 13719880} {"current_steps": 335, "total_steps": 1080, "loss": 0.0943, "lr": 3.9040052669587325e-05, "epoch": 6.091743119266055, "percentage": 31.02, "elapsed_time": "1:37:03", "remaining_time": "3:35:51", "throughput": 2363.56, "total_tokens": 13764864} {"current_steps": 336, "total_steps": 1080, "loss": 0.1039, "lr": 3.897982258676867e-05, "epoch": 6.110091743119266, "percentage": 31.11, "elapsed_time": "1:37:17", "remaining_time": "3:35:26", "throughput": 2363.12, "total_tokens": 13795048} {"current_steps": 337, "total_steps": 1080, "loss": 0.1294, "lr": 3.891947421243661e-05, "epoch": 6.128440366972477, "percentage": 31.2, "elapsed_time": "1:37:34", "remaining_time": "3:35:08", "throughput": 2362.19, "total_tokens": 13830064} {"current_steps": 338, "total_steps": 1080, "loss": 0.1233, "lr": 3.885900805723429e-05, "epoch": 6.146788990825688, "percentage": 31.3, "elapsed_time": "1:37:50", "remaining_time": "3:34:48", "throughput": 2362.59, "total_tokens": 13870392} {"current_steps": 339, "total_steps": 1080, "loss": 0.1252, "lr": 3.879842463280145e-05, "epoch": 6.165137614678899, "percentage": 31.39, "elapsed_time": "1:38:08", "remaining_time": "3:34:31", "throughput": 2362.69, "total_tokens": 13913144} {"current_steps": 340, "total_steps": 1080, "loss": 0.1191, "lr": 3.873772445177015e-05, "epoch": 6.18348623853211, "percentage": 31.48, "elapsed_time": "1:38:24", "remaining_time": "3:34:10", "throughput": 2362.7, "total_tokens": 13950384} {"current_steps": 341, "total_steps": 1080, "loss": 0.1028, "lr": 3.8676908027760364e-05, "epoch": 6.201834862385321, "percentage": 31.57, "elapsed_time": "1:38:41", "remaining_time": "3:33:52", "throughput": 2362.79, "total_tokens": 13990464} {"current_steps": 342, "total_steps": 1080, "loss": 0.0996, "lr": 3.861597587537568e-05, "epoch": 6.220183486238533, "percentage": 31.67, "elapsed_time": "1:38:55", "remaining_time": "3:33:29", "throughput": 2363.41, "total_tokens": 14029080} {"current_steps": 343, "total_steps": 1080, "loss": 0.172, "lr": 3.855492851019893e-05, "epoch": 6.238532110091743, "percentage": 31.76, "elapsed_time": "1:39:12", "remaining_time": "3:33:10", "throughput": 2363.66, "total_tokens": 14069824} {"current_steps": 344, "total_steps": 1080, "loss": 0.1244, "lr": 3.8493766448787825e-05, "epoch": 6.256880733944954, "percentage": 31.85, "elapsed_time": "1:39:29", "remaining_time": "3:32:51", "throughput": 2363.42, "total_tokens": 14107616} {"current_steps": 345, "total_steps": 1080, "loss": 0.1584, "lr": 3.84324902086706e-05, "epoch": 6.275229357798165, "percentage": 31.94, "elapsed_time": "1:39:46", "remaining_time": "3:32:33", "throughput": 2363.16, "total_tokens": 14146224} {"current_steps": 346, "total_steps": 1080, "loss": 0.1154, "lr": 3.837110030834161e-05, "epoch": 6.293577981651376, "percentage": 32.04, "elapsed_time": "1:40:00", "remaining_time": "3:32:08", "throughput": 2363.96, "total_tokens": 14183880} {"current_steps": 347, "total_steps": 1080, "loss": 0.098, "lr": 3.830959726725697e-05, "epoch": 6.3119266055045875, "percentage": 32.13, "elapsed_time": "1:40:13", "remaining_time": "3:31:43", "throughput": 2363.75, "total_tokens": 14214632} {"current_steps": 348, "total_steps": 1080, "loss": 0.2212, "lr": 3.824798160583012e-05, "epoch": 6.330275229357798, "percentage": 32.22, "elapsed_time": "1:40:33", "remaining_time": "3:31:31", "throughput": 2363.89, "total_tokens": 14263168} {"current_steps": 349, "total_steps": 1080, "loss": 0.1423, "lr": 3.81862538454275e-05, "epoch": 6.348623853211009, "percentage": 32.31, "elapsed_time": "1:40:50", "remaining_time": "3:31:13", "throughput": 2363.98, "total_tokens": 14303680} {"current_steps": 350, "total_steps": 1080, "loss": 0.1119, "lr": 3.8124414508364e-05, "epoch": 6.36697247706422, "percentage": 32.41, "elapsed_time": "1:41:09", "remaining_time": "3:30:58", "throughput": 2363.99, "total_tokens": 14347672} {"current_steps": 351, "total_steps": 1080, "loss": 0.1068, "lr": 3.8062464117898724e-05, "epoch": 6.385321100917431, "percentage": 32.5, "elapsed_time": "1:41:27", "remaining_time": "3:30:43", "throughput": 2364.56, "total_tokens": 14394848} {"current_steps": 352, "total_steps": 1080, "loss": 0.1051, "lr": 3.8000403198230387e-05, "epoch": 6.4036697247706424, "percentage": 32.59, "elapsed_time": "1:41:48", "remaining_time": "3:30:33", "throughput": 2363.67, "total_tokens": 14438856} {"current_steps": 353, "total_steps": 1080, "loss": 0.2208, "lr": 3.7938232274493e-05, "epoch": 6.422018348623853, "percentage": 32.69, "elapsed_time": "1:42:16", "remaining_time": "3:30:37", "throughput": 2362.62, "total_tokens": 14498032} {"current_steps": 354, "total_steps": 1080, "loss": 0.1131, "lr": 3.787595187275136e-05, "epoch": 6.440366972477064, "percentage": 32.78, "elapsed_time": "1:42:31", "remaining_time": "3:30:16", "throughput": 2362.64, "total_tokens": 14534256} {"current_steps": 355, "total_steps": 1080, "loss": 0.1207, "lr": 3.781356251999663e-05, "epoch": 6.458715596330276, "percentage": 32.87, "elapsed_time": "1:42:49", "remaining_time": "3:29:58", "throughput": 2362.56, "total_tokens": 14575016} {"current_steps": 356, "total_steps": 1080, "loss": 0.0887, "lr": 3.775106474414188e-05, "epoch": 6.477064220183486, "percentage": 32.96, "elapsed_time": "1:43:10", "remaining_time": "3:29:50", "throughput": 2362.74, "total_tokens": 14627272} {"current_steps": 357, "total_steps": 1080, "loss": 0.1022, "lr": 3.7688459074017606e-05, "epoch": 6.495412844036697, "percentage": 33.06, "elapsed_time": "1:43:23", "remaining_time": "3:29:23", "throughput": 2362.87, "total_tokens": 14658696} {"current_steps": 358, "total_steps": 1080, "loss": 0.1582, "lr": 3.762574603936725e-05, "epoch": 6.513761467889909, "percentage": 33.15, "elapsed_time": "1:43:41", "remaining_time": "3:29:06", "throughput": 2363.28, "total_tokens": 14702208} {"current_steps": 359, "total_steps": 1080, "loss": 0.0855, "lr": 3.756292617084275e-05, "epoch": 6.532110091743119, "percentage": 33.24, "elapsed_time": "1:44:02", "remaining_time": "3:28:57", "throughput": 2363.89, "total_tokens": 14757376} {"current_steps": 360, "total_steps": 1080, "loss": 0.1923, "lr": 3.7500000000000003e-05, "epoch": 6.5504587155963305, "percentage": 33.33, "elapsed_time": "1:44:19", "remaining_time": "3:28:38", "throughput": 2363.88, "total_tokens": 14796592} {"current_steps": 361, "total_steps": 1080, "loss": 0.1125, "lr": 3.7436968059294414e-05, "epoch": 6.568807339449541, "percentage": 33.43, "elapsed_time": "1:44:35", "remaining_time": "3:28:19", "throughput": 2363.74, "total_tokens": 14834656} {"current_steps": 362, "total_steps": 1080, "loss": 0.1947, "lr": 3.7373830882076354e-05, "epoch": 6.587155963302752, "percentage": 33.52, "elapsed_time": "1:44:49", "remaining_time": "3:27:55", "throughput": 2364.11, "total_tokens": 14869528} {"current_steps": 363, "total_steps": 1080, "loss": 0.1173, "lr": 3.731058900258668e-05, "epoch": 6.605504587155964, "percentage": 33.61, "elapsed_time": "1:45:07", "remaining_time": "3:27:37", "throughput": 2363.95, "total_tokens": 14909720} {"current_steps": 364, "total_steps": 1080, "loss": 0.1523, "lr": 3.7247242955952175e-05, "epoch": 6.623853211009174, "percentage": 33.7, "elapsed_time": "1:45:24", "remaining_time": "3:27:20", "throughput": 2364.19, "total_tokens": 14952704} {"current_steps": 365, "total_steps": 1080, "loss": 0.1313, "lr": 3.718379327818106e-05, "epoch": 6.6422018348623855, "percentage": 33.8, "elapsed_time": "1:45:41", "remaining_time": "3:27:02", "throughput": 2363.79, "total_tokens": 14989640} {"current_steps": 366, "total_steps": 1080, "loss": 0.0985, "lr": 3.712024050615843e-05, "epoch": 6.660550458715596, "percentage": 33.89, "elapsed_time": "1:45:58", "remaining_time": "3:26:45", "throughput": 2363.33, "total_tokens": 15028200} {"current_steps": 367, "total_steps": 1080, "loss": 0.1905, "lr": 3.705658517764172e-05, "epoch": 6.678899082568807, "percentage": 33.98, "elapsed_time": "1:46:19", "remaining_time": "3:26:34", "throughput": 2363.15, "total_tokens": 15075960} {"current_steps": 368, "total_steps": 1080, "loss": 0.1166, "lr": 3.699282783125616e-05, "epoch": 6.697247706422019, "percentage": 34.07, "elapsed_time": "1:46:34", "remaining_time": "3:26:12", "throughput": 2363.33, "total_tokens": 15113096} {"current_steps": 369, "total_steps": 1080, "loss": 0.138, "lr": 3.692896900649021e-05, "epoch": 6.715596330275229, "percentage": 34.17, "elapsed_time": "1:46:57", "remaining_time": "3:26:04", "throughput": 2362.83, "total_tokens": 15162432} {"current_steps": 370, "total_steps": 1080, "loss": 0.1612, "lr": 3.686500924369101e-05, "epoch": 6.73394495412844, "percentage": 34.26, "elapsed_time": "1:47:12", "remaining_time": "3:25:44", "throughput": 2363.43, "total_tokens": 15203656} {"current_steps": 371, "total_steps": 1080, "loss": 0.1131, "lr": 3.680094908405978e-05, "epoch": 6.752293577981652, "percentage": 34.35, "elapsed_time": "1:47:33", "remaining_time": "3:25:32", "throughput": 2363.35, "total_tokens": 15251056} {"current_steps": 372, "total_steps": 1080, "loss": 0.1264, "lr": 3.673678906964727e-05, "epoch": 6.770642201834862, "percentage": 34.44, "elapsed_time": "1:47:46", "remaining_time": "3:25:07", "throughput": 2363.4, "total_tokens": 15283552} {"current_steps": 373, "total_steps": 1080, "loss": 0.1167, "lr": 3.6672529743349146e-05, "epoch": 6.7889908256880735, "percentage": 34.54, "elapsed_time": "1:48:11", "remaining_time": "3:25:05", "throughput": 2362.77, "total_tokens": 15338944} {"current_steps": 374, "total_steps": 1080, "loss": 0.131, "lr": 3.660817164890143e-05, "epoch": 6.807339449541285, "percentage": 34.63, "elapsed_time": "1:48:24", "remaining_time": "3:24:39", "throughput": 2362.85, "total_tokens": 15369936} {"current_steps": 375, "total_steps": 1080, "loss": 0.095, "lr": 3.654371533087586e-05, "epoch": 6.825688073394495, "percentage": 34.72, "elapsed_time": "1:48:41", "remaining_time": "3:24:19", "throughput": 2363.34, "total_tokens": 15411576} {"current_steps": 376, "total_steps": 1080, "loss": 0.0937, "lr": 3.6479161334675296e-05, "epoch": 6.844036697247707, "percentage": 34.81, "elapsed_time": "1:48:59", "remaining_time": "3:24:04", "throughput": 2363.66, "total_tokens": 15457520} {"current_steps": 377, "total_steps": 1080, "loss": 0.1017, "lr": 3.641451020652914e-05, "epoch": 6.862385321100917, "percentage": 34.91, "elapsed_time": "1:49:11", "remaining_time": "3:23:37", "throughput": 2363.59, "total_tokens": 15485536} {"current_steps": 378, "total_steps": 1080, "loss": 0.1075, "lr": 3.634976249348867e-05, "epoch": 6.8807339449541285, "percentage": 35.0, "elapsed_time": "1:49:28", "remaining_time": "3:23:18", "throughput": 2363.78, "total_tokens": 15526704} {"current_steps": 379, "total_steps": 1080, "loss": 0.132, "lr": 3.6284918743422425e-05, "epoch": 6.89908256880734, "percentage": 35.09, "elapsed_time": "1:49:47", "remaining_time": "3:23:04", "throughput": 2363.1, "total_tokens": 15567344} {"current_steps": 380, "total_steps": 1080, "loss": 0.1435, "lr": 3.621997950501156e-05, "epoch": 6.91743119266055, "percentage": 35.19, "elapsed_time": "1:50:04", "remaining_time": "3:22:45", "throughput": 2363.44, "total_tokens": 15608408} {"current_steps": 381, "total_steps": 1080, "loss": 0.0958, "lr": 3.615494532774522e-05, "epoch": 6.935779816513762, "percentage": 35.28, "elapsed_time": "1:50:30", "remaining_time": "3:22:44", "throughput": 2362.94, "total_tokens": 15667496} {"current_steps": 382, "total_steps": 1080, "loss": 0.1465, "lr": 3.6089816761915906e-05, "epoch": 6.954128440366972, "percentage": 35.37, "elapsed_time": "1:50:50", "remaining_time": "3:22:31", "throughput": 2363.14, "total_tokens": 15715496} {"current_steps": 383, "total_steps": 1080, "loss": 0.1111, "lr": 3.602459435861475e-05, "epoch": 6.972477064220183, "percentage": 35.46, "elapsed_time": "1:51:05", "remaining_time": "3:22:10", "throughput": 2363.7, "total_tokens": 15755688} {"current_steps": 384, "total_steps": 1080, "loss": 0.1084, "lr": 3.5959278669726935e-05, "epoch": 6.990825688073395, "percentage": 35.56, "elapsed_time": "1:51:23", "remaining_time": "3:21:54", "throughput": 2363.62, "total_tokens": 15798304} {"current_steps": 385, "total_steps": 1080, "loss": 0.1234, "lr": 3.589387024792699e-05, "epoch": 7.0, "percentage": 35.65, "elapsed_time": "1:51:31", "remaining_time": "3:21:19", "throughput": 2363.23, "total_tokens": 15813616} {"current_steps": 386, "total_steps": 1080, "loss": 0.1167, "lr": 3.582836964667408e-05, "epoch": 7.018348623853211, "percentage": 35.74, "elapsed_time": "1:51:50", "remaining_time": "3:21:05", "throughput": 2362.72, "total_tokens": 15855256} {"current_steps": 387, "total_steps": 1080, "loss": 0.0829, "lr": 3.576277742020738e-05, "epoch": 7.036697247706422, "percentage": 35.83, "elapsed_time": "1:52:04", "remaining_time": "3:20:41", "throughput": 2362.64, "total_tokens": 15887512} {"current_steps": 388, "total_steps": 1080, "loss": 0.1213, "lr": 3.569709412354136e-05, "epoch": 7.055045871559633, "percentage": 35.93, "elapsed_time": "1:52:22", "remaining_time": "3:20:26", "throughput": 2363.14, "total_tokens": 15934400} {"current_steps": 389, "total_steps": 1080, "loss": 0.0914, "lr": 3.563132031246108e-05, "epoch": 7.073394495412844, "percentage": 36.02, "elapsed_time": "1:52:37", "remaining_time": "3:20:04", "throughput": 2363.14, "total_tokens": 15969904} {"current_steps": 390, "total_steps": 1080, "loss": 0.09, "lr": 3.556545654351749e-05, "epoch": 7.091743119266055, "percentage": 36.11, "elapsed_time": "1:52:55", "remaining_time": "3:19:47", "throughput": 2362.96, "total_tokens": 16010760} {"current_steps": 391, "total_steps": 1080, "loss": 0.0832, "lr": 3.549950337402274e-05, "epoch": 7.110091743119266, "percentage": 36.2, "elapsed_time": "1:53:14", "remaining_time": "3:19:32", "throughput": 2363.68, "total_tokens": 16059680} {"current_steps": 392, "total_steps": 1080, "loss": 0.079, "lr": 3.543346136204545e-05, "epoch": 7.128440366972477, "percentage": 36.3, "elapsed_time": "1:53:30", "remaining_time": "3:19:12", "throughput": 2363.51, "total_tokens": 16095992} {"current_steps": 393, "total_steps": 1080, "loss": 0.1, "lr": 3.536733106640598e-05, "epoch": 7.146788990825688, "percentage": 36.39, "elapsed_time": "1:53:47", "remaining_time": "3:18:54", "throughput": 2363.43, "total_tokens": 16135568} {"current_steps": 394, "total_steps": 1080, "loss": 0.0962, "lr": 3.5301113046671714e-05, "epoch": 7.165137614678899, "percentage": 36.48, "elapsed_time": "1:54:00", "remaining_time": "3:18:30", "throughput": 2363.05, "total_tokens": 16165016} {"current_steps": 395, "total_steps": 1080, "loss": 0.0923, "lr": 3.523480786315231e-05, "epoch": 7.18348623853211, "percentage": 36.57, "elapsed_time": "1:54:18", "remaining_time": "3:18:14", "throughput": 2363.15, "total_tokens": 16208344} {"current_steps": 396, "total_steps": 1080, "loss": 0.101, "lr": 3.516841607689501e-05, "epoch": 7.201834862385321, "percentage": 36.67, "elapsed_time": "1:54:35", "remaining_time": "3:17:55", "throughput": 2362.74, "total_tokens": 16244312} {"current_steps": 397, "total_steps": 1080, "loss": 0.1124, "lr": 3.5101938249679794e-05, "epoch": 7.220183486238533, "percentage": 36.76, "elapsed_time": "1:54:51", "remaining_time": "3:17:36", "throughput": 2362.81, "total_tokens": 16283848} {"current_steps": 398, "total_steps": 1080, "loss": 0.1054, "lr": 3.503537494401473e-05, "epoch": 7.238532110091743, "percentage": 36.85, "elapsed_time": "1:55:12", "remaining_time": "3:17:25", "throughput": 2363.19, "total_tokens": 16336288} {"current_steps": 399, "total_steps": 1080, "loss": 0.1781, "lr": 3.496872672313116e-05, "epoch": 7.256880733944954, "percentage": 36.94, "elapsed_time": "1:55:30", "remaining_time": "3:17:08", "throughput": 2362.87, "total_tokens": 16375448} {"current_steps": 400, "total_steps": 1080, "loss": 0.0935, "lr": 3.490199415097892e-05, "epoch": 7.275229357798165, "percentage": 37.04, "elapsed_time": "1:55:45", "remaining_time": "3:16:47", "throughput": 2363.04, "total_tokens": 16412608} {"current_steps": 401, "total_steps": 1080, "loss": 0.0944, "lr": 3.483517779222163e-05, "epoch": 7.293577981651376, "percentage": 37.13, "elapsed_time": "1:56:01", "remaining_time": "3:16:27", "throughput": 2363.86, "total_tokens": 16455904} {"current_steps": 402, "total_steps": 1080, "loss": 0.0878, "lr": 3.476827821223184e-05, "epoch": 7.3119266055045875, "percentage": 37.22, "elapsed_time": "1:56:18", "remaining_time": "3:16:08", "throughput": 2364.1, "total_tokens": 16496824} {"current_steps": 403, "total_steps": 1080, "loss": 0.0911, "lr": 3.4701295977086324e-05, "epoch": 7.330275229357798, "percentage": 37.31, "elapsed_time": "1:56:30", "remaining_time": "3:15:43", "throughput": 2364.53, "total_tokens": 16529344} {"current_steps": 404, "total_steps": 1080, "loss": 0.1047, "lr": 3.463423165356121e-05, "epoch": 7.348623853211009, "percentage": 37.41, "elapsed_time": "1:56:44", "remaining_time": "3:15:21", "throughput": 2364.55, "total_tokens": 16563664} {"current_steps": 405, "total_steps": 1080, "loss": 0.1228, "lr": 3.456708580912725e-05, "epoch": 7.36697247706422, "percentage": 37.5, "elapsed_time": "1:57:01", "remaining_time": "3:15:02", "throughput": 2365.19, "total_tokens": 16607272} {"current_steps": 406, "total_steps": 1080, "loss": 0.1801, "lr": 3.449985901194498e-05, "epoch": 7.385321100917431, "percentage": 37.59, "elapsed_time": "1:57:19", "remaining_time": "3:14:45", "throughput": 2364.78, "total_tokens": 16646040} {"current_steps": 407, "total_steps": 1080, "loss": 0.0883, "lr": 3.443255183085993e-05, "epoch": 7.4036697247706424, "percentage": 37.69, "elapsed_time": "1:57:38", "remaining_time": "3:14:31", "throughput": 2365.1, "total_tokens": 16693544} {"current_steps": 408, "total_steps": 1080, "loss": 0.083, "lr": 3.436516483539781e-05, "epoch": 7.422018348623853, "percentage": 37.78, "elapsed_time": "1:58:01", "remaining_time": "3:14:23", "throughput": 2364.23, "total_tokens": 16742128} {"current_steps": 409, "total_steps": 1080, "loss": 0.1247, "lr": 3.4297698595759664e-05, "epoch": 7.440366972477064, "percentage": 37.87, "elapsed_time": "1:58:22", "remaining_time": "3:14:12", "throughput": 2364.2, "total_tokens": 16792000} {"current_steps": 410, "total_steps": 1080, "loss": 0.0948, "lr": 3.423015368281711e-05, "epoch": 7.458715596330276, "percentage": 37.96, "elapsed_time": "1:58:35", "remaining_time": "3:13:48", "throughput": 2364.32, "total_tokens": 16824312} {"current_steps": 411, "total_steps": 1080, "loss": 0.0993, "lr": 3.4162530668107434e-05, "epoch": 7.477064220183486, "percentage": 38.06, "elapsed_time": "1:58:50", "remaining_time": "3:13:26", "throughput": 2363.93, "total_tokens": 16856344} {"current_steps": 412, "total_steps": 1080, "loss": 0.1273, "lr": 3.409483012382879e-05, "epoch": 7.495412844036697, "percentage": 38.15, "elapsed_time": "1:59:09", "remaining_time": "3:13:11", "throughput": 2363.72, "total_tokens": 16898256} {"current_steps": 413, "total_steps": 1080, "loss": 0.1171, "lr": 3.402705262283537e-05, "epoch": 7.513761467889909, "percentage": 38.24, "elapsed_time": "1:59:27", "remaining_time": "3:12:54", "throughput": 2363.51, "total_tokens": 16939304} {"current_steps": 414, "total_steps": 1080, "loss": 0.1753, "lr": 3.39591987386325e-05, "epoch": 7.532110091743119, "percentage": 38.33, "elapsed_time": "1:59:43", "remaining_time": "3:12:36", "throughput": 2363.44, "total_tokens": 16978632} {"current_steps": 415, "total_steps": 1080, "loss": 0.1567, "lr": 3.389126904537192e-05, "epoch": 7.5504587155963305, "percentage": 38.43, "elapsed_time": "2:00:00", "remaining_time": "3:12:17", "throughput": 2363.29, "total_tokens": 17016552} {"current_steps": 416, "total_steps": 1080, "loss": 0.0941, "lr": 3.382326411784672e-05, "epoch": 7.568807339449541, "percentage": 38.52, "elapsed_time": "2:00:21", "remaining_time": "3:12:07", "throughput": 2363.34, "total_tokens": 17067688} {"current_steps": 417, "total_steps": 1080, "loss": 0.0961, "lr": 3.375518453148669e-05, "epoch": 7.587155963302752, "percentage": 38.61, "elapsed_time": "2:00:46", "remaining_time": "3:12:02", "throughput": 2363.21, "total_tokens": 17126008} {"current_steps": 418, "total_steps": 1080, "loss": 0.1974, "lr": 3.3687030862353286e-05, "epoch": 7.605504587155964, "percentage": 38.7, "elapsed_time": "2:01:05", "remaining_time": "3:11:46", "throughput": 2362.77, "total_tokens": 17165800} {"current_steps": 419, "total_steps": 1080, "loss": 0.094, "lr": 3.361880368713486e-05, "epoch": 7.623853211009174, "percentage": 38.8, "elapsed_time": "2:01:19", "remaining_time": "3:11:23", "throughput": 2362.93, "total_tokens": 17199832} {"current_steps": 420, "total_steps": 1080, "loss": 0.0717, "lr": 3.355050358314172e-05, "epoch": 7.6422018348623855, "percentage": 38.89, "elapsed_time": "2:01:35", "remaining_time": "3:11:03", "throughput": 2362.93, "total_tokens": 17237952} {"current_steps": 421, "total_steps": 1080, "loss": 0.0943, "lr": 3.348213112830128e-05, "epoch": 7.660550458715596, "percentage": 38.98, "elapsed_time": "2:01:52", "remaining_time": "3:10:46", "throughput": 2362.81, "total_tokens": 17278384} {"current_steps": 422, "total_steps": 1080, "loss": 0.0814, "lr": 3.3413686901153165e-05, "epoch": 7.678899082568807, "percentage": 39.07, "elapsed_time": "2:02:05", "remaining_time": "3:10:21", "throughput": 2362.98, "total_tokens": 17309544} {"current_steps": 423, "total_steps": 1080, "loss": 0.1192, "lr": 3.3345171480844275e-05, "epoch": 7.697247706422019, "percentage": 39.17, "elapsed_time": "2:02:19", "remaining_time": "3:09:59", "throughput": 2363.28, "total_tokens": 17344896} {"current_steps": 424, "total_steps": 1080, "loss": 0.104, "lr": 3.327658544712395e-05, "epoch": 7.715596330275229, "percentage": 39.26, "elapsed_time": "2:02:50", "remaining_time": "3:10:03", "throughput": 2362.48, "total_tokens": 17413176} {"current_steps": 425, "total_steps": 1080, "loss": 0.0965, "lr": 3.3207929380339034e-05, "epoch": 7.73394495412844, "percentage": 39.35, "elapsed_time": "2:03:06", "remaining_time": "3:09:43", "throughput": 2362.53, "total_tokens": 17450416} {"current_steps": 426, "total_steps": 1080, "loss": 0.0775, "lr": 3.313920386142892e-05, "epoch": 7.752293577981652, "percentage": 39.44, "elapsed_time": "2:03:23", "remaining_time": "3:09:25", "throughput": 2362.65, "total_tokens": 17491256} {"current_steps": 427, "total_steps": 1080, "loss": 0.1651, "lr": 3.3070409471920726e-05, "epoch": 7.770642201834862, "percentage": 39.54, "elapsed_time": "2:03:36", "remaining_time": "3:09:02", "throughput": 2362.42, "total_tokens": 17521600} {"current_steps": 428, "total_steps": 1080, "loss": 0.1071, "lr": 3.3001546793924285e-05, "epoch": 7.7889908256880735, "percentage": 39.63, "elapsed_time": "2:03:56", "remaining_time": "3:08:47", "throughput": 2362.04, "total_tokens": 17564288} {"current_steps": 429, "total_steps": 1080, "loss": 0.0987, "lr": 3.293261641012731e-05, "epoch": 7.807339449541285, "percentage": 39.72, "elapsed_time": "2:04:11", "remaining_time": "3:08:27", "throughput": 2362.46, "total_tokens": 17604304} {"current_steps": 430, "total_steps": 1080, "loss": 0.1743, "lr": 3.2863618903790346e-05, "epoch": 7.825688073394495, "percentage": 39.81, "elapsed_time": "2:04:27", "remaining_time": "3:08:08", "throughput": 2362.39, "total_tokens": 17641384} {"current_steps": 431, "total_steps": 1080, "loss": 0.0854, "lr": 3.279455485874195e-05, "epoch": 7.844036697247707, "percentage": 39.91, "elapsed_time": "2:04:44", "remaining_time": "3:07:50", "throughput": 2362.17, "total_tokens": 17680560} {"current_steps": 432, "total_steps": 1080, "loss": 0.0949, "lr": 3.272542485937369e-05, "epoch": 7.862385321100917, "percentage": 40.0, "elapsed_time": "2:04:59", "remaining_time": "3:07:29", "throughput": 2362.24, "total_tokens": 17715312} {"current_steps": 433, "total_steps": 1080, "loss": 0.1377, "lr": 3.26562294906352e-05, "epoch": 7.8807339449541285, "percentage": 40.09, "elapsed_time": "2:05:21", "remaining_time": "3:07:18", "throughput": 2362.14, "total_tokens": 17766056} {"current_steps": 434, "total_steps": 1080, "loss": 0.1035, "lr": 3.2586969338029274e-05, "epoch": 7.89908256880734, "percentage": 40.19, "elapsed_time": "2:05:38", "remaining_time": "3:07:01", "throughput": 2362.37, "total_tokens": 17809040} {"current_steps": 435, "total_steps": 1080, "loss": 0.0844, "lr": 3.251764498760683e-05, "epoch": 7.91743119266055, "percentage": 40.28, "elapsed_time": "2:05:57", "remaining_time": "3:06:45", "throughput": 2362.84, "total_tokens": 17856896} {"current_steps": 436, "total_steps": 1080, "loss": 0.1295, "lr": 3.244825702596205e-05, "epoch": 7.935779816513762, "percentage": 40.37, "elapsed_time": "2:06:25", "remaining_time": "3:06:43", "throughput": 2362.14, "total_tokens": 17917200} {"current_steps": 437, "total_steps": 1080, "loss": 0.0662, "lr": 3.237880604022735e-05, "epoch": 7.954128440366972, "percentage": 40.46, "elapsed_time": "2:06:47", "remaining_time": "3:06:34", "throughput": 2361.76, "total_tokens": 17967840} {"current_steps": 438, "total_steps": 1080, "loss": 0.087, "lr": 3.230929261806842e-05, "epoch": 7.972477064220183, "percentage": 40.56, "elapsed_time": "2:07:01", "remaining_time": "3:06:11", "throughput": 2361.88, "total_tokens": 18001712} {"current_steps": 439, "total_steps": 1080, "loss": 0.0808, "lr": 3.223971734767928e-05, "epoch": 7.990825688073395, "percentage": 40.65, "elapsed_time": "2:07:20", "remaining_time": "3:05:56", "throughput": 2361.75, "total_tokens": 18044712} {"current_steps": 440, "total_steps": 1080, "loss": 0.09, "lr": 3.217008081777726e-05, "epoch": 8.0, "percentage": 40.74, "elapsed_time": "2:07:31", "remaining_time": "3:05:28", "throughput": 2362.09, "total_tokens": 18072704} {"current_steps": 441, "total_steps": 1080, "loss": 0.0775, "lr": 3.210038361759807e-05, "epoch": 8.01834862385321, "percentage": 40.83, "elapsed_time": "2:07:42", "remaining_time": "3:05:03", "throughput": 2362.54, "total_tokens": 18103680} {"current_steps": 442, "total_steps": 1080, "loss": 0.0667, "lr": 3.203062633689077e-05, "epoch": 8.036697247706423, "percentage": 40.93, "elapsed_time": "2:07:55", "remaining_time": "3:04:39", "throughput": 2362.45, "total_tokens": 18133248} {"current_steps": 443, "total_steps": 1080, "loss": 0.0616, "lr": 3.1960809565912794e-05, "epoch": 8.055045871559633, "percentage": 41.02, "elapsed_time": "2:08:18", "remaining_time": "3:04:30", "throughput": 2362.12, "total_tokens": 18185672} {"current_steps": 444, "total_steps": 1080, "loss": 0.0909, "lr": 3.1890933895424976e-05, "epoch": 8.073394495412844, "percentage": 41.11, "elapsed_time": "2:08:36", "remaining_time": "3:04:12", "throughput": 2362.39, "total_tokens": 18228240} {"current_steps": 445, "total_steps": 1080, "loss": 0.0688, "lr": 3.182099991668653e-05, "epoch": 8.091743119266056, "percentage": 41.2, "elapsed_time": "2:08:53", "remaining_time": "3:03:55", "throughput": 2362.66, "total_tokens": 18271416} {"current_steps": 446, "total_steps": 1080, "loss": 0.1181, "lr": 3.1751008221450025e-05, "epoch": 8.110091743119266, "percentage": 41.3, "elapsed_time": "2:09:10", "remaining_time": "3:03:36", "throughput": 2363.11, "total_tokens": 18314208} {"current_steps": 447, "total_steps": 1080, "loss": 0.1408, "lr": 3.168095940195642e-05, "epoch": 8.128440366972477, "percentage": 41.39, "elapsed_time": "2:09:32", "remaining_time": "3:03:27", "throughput": 2363.67, "total_tokens": 18372552} {"current_steps": 448, "total_steps": 1080, "loss": 0.0613, "lr": 3.161085405093006e-05, "epoch": 8.146788990825687, "percentage": 41.48, "elapsed_time": "2:09:51", "remaining_time": "3:03:11", "throughput": 2363.87, "total_tokens": 18418048} {"current_steps": 449, "total_steps": 1080, "loss": 0.071, "lr": 3.154069276157359e-05, "epoch": 8.1651376146789, "percentage": 41.57, "elapsed_time": "2:10:08", "remaining_time": "3:02:53", "throughput": 2364.08, "total_tokens": 18459656} {"current_steps": 450, "total_steps": 1080, "loss": 0.0781, "lr": 3.147047612756302e-05, "epoch": 8.18348623853211, "percentage": 41.67, "elapsed_time": "2:10:21", "remaining_time": "3:02:29", "throughput": 2364.0, "total_tokens": 18489056} {"current_steps": 451, "total_steps": 1080, "loss": 0.1724, "lr": 3.140020474304265e-05, "epoch": 8.20183486238532, "percentage": 41.76, "elapsed_time": "2:10:42", "remaining_time": "3:02:17", "throughput": 2363.54, "total_tokens": 18536296} {"current_steps": 452, "total_steps": 1080, "loss": 0.072, "lr": 3.132987920262005e-05, "epoch": 8.220183486238533, "percentage": 41.85, "elapsed_time": "2:10:56", "remaining_time": "3:01:55", "throughput": 2363.7, "total_tokens": 18569984} {"current_steps": 453, "total_steps": 1080, "loss": 0.0831, "lr": 3.125950010136104e-05, "epoch": 8.238532110091743, "percentage": 41.94, "elapsed_time": "2:11:10", "remaining_time": "3:01:33", "throughput": 2363.42, "total_tokens": 18600496} {"current_steps": 454, "total_steps": 1080, "loss": 0.0763, "lr": 3.118906803478465e-05, "epoch": 8.256880733944953, "percentage": 42.04, "elapsed_time": "2:11:29", "remaining_time": "3:01:18", "throughput": 2363.19, "total_tokens": 18644784} {"current_steps": 455, "total_steps": 1080, "loss": 0.0693, "lr": 3.11185835988581e-05, "epoch": 8.275229357798166, "percentage": 42.13, "elapsed_time": "2:11:44", "remaining_time": "3:00:57", "throughput": 2363.58, "total_tokens": 18682928} {"current_steps": 456, "total_steps": 1080, "loss": 0.069, "lr": 3.104804738999169e-05, "epoch": 8.293577981651376, "percentage": 42.22, "elapsed_time": "2:12:07", "remaining_time": "3:00:48", "throughput": 2363.36, "total_tokens": 18735736} {"current_steps": 457, "total_steps": 1080, "loss": 0.0716, "lr": 3.097746000503386e-05, "epoch": 8.311926605504587, "percentage": 42.31, "elapsed_time": "2:12:25", "remaining_time": "3:00:31", "throughput": 2363.47, "total_tokens": 18779416} {"current_steps": 458, "total_steps": 1080, "loss": 0.081, "lr": 3.090682204126604e-05, "epoch": 8.330275229357799, "percentage": 42.41, "elapsed_time": "2:12:38", "remaining_time": "3:00:08", "throughput": 2363.79, "total_tokens": 18813088} {"current_steps": 459, "total_steps": 1080, "loss": 0.088, "lr": 3.083613409639764e-05, "epoch": 8.34862385321101, "percentage": 42.5, "elapsed_time": "2:12:50", "remaining_time": "2:59:44", "throughput": 2363.45, "total_tokens": 18838800} {"current_steps": 460, "total_steps": 1080, "loss": 0.0616, "lr": 3.076539676856101e-05, "epoch": 8.36697247706422, "percentage": 42.59, "elapsed_time": "2:13:10", "remaining_time": "2:59:29", "throughput": 2363.21, "total_tokens": 18882128} {"current_steps": 461, "total_steps": 1080, "loss": 0.0685, "lr": 3.069461065630634e-05, "epoch": 8.385321100917432, "percentage": 42.69, "elapsed_time": "2:13:29", "remaining_time": "2:59:14", "throughput": 2363.18, "total_tokens": 18927120} {"current_steps": 462, "total_steps": 1080, "loss": 0.1019, "lr": 3.062377635859663e-05, "epoch": 8.403669724770642, "percentage": 42.78, "elapsed_time": "2:13:47", "remaining_time": "2:58:58", "throughput": 2362.87, "total_tokens": 18968240} {"current_steps": 463, "total_steps": 1080, "loss": 0.1115, "lr": 3.0552894474802584e-05, "epoch": 8.422018348623853, "percentage": 42.87, "elapsed_time": "2:14:08", "remaining_time": "2:58:45", "throughput": 2362.4, "total_tokens": 19013248} {"current_steps": 464, "total_steps": 1080, "loss": 0.0648, "lr": 3.048196560469758e-05, "epoch": 8.440366972477065, "percentage": 42.96, "elapsed_time": "2:14:26", "remaining_time": "2:58:29", "throughput": 2362.6, "total_tokens": 19058904} {"current_steps": 465, "total_steps": 1080, "loss": 0.0678, "lr": 3.0410990348452573e-05, "epoch": 8.458715596330276, "percentage": 43.06, "elapsed_time": "2:14:44", "remaining_time": "2:58:11", "throughput": 2363.03, "total_tokens": 19103128} {"current_steps": 466, "total_steps": 1080, "loss": 0.1322, "lr": 3.0339969306631005e-05, "epoch": 8.477064220183486, "percentage": 43.15, "elapsed_time": "2:15:00", "remaining_time": "2:57:53", "throughput": 2363.27, "total_tokens": 19144648} {"current_steps": 467, "total_steps": 1080, "loss": 0.0935, "lr": 3.0268903080183743e-05, "epoch": 8.495412844036696, "percentage": 43.24, "elapsed_time": "2:15:17", "remaining_time": "2:57:35", "throughput": 2363.03, "total_tokens": 19182568} {"current_steps": 468, "total_steps": 1080, "loss": 0.1373, "lr": 3.0197792270443982e-05, "epoch": 8.513761467889909, "percentage": 43.33, "elapsed_time": "2:15:32", "remaining_time": "2:57:14", "throughput": 2363.22, "total_tokens": 19218336} {"current_steps": 469, "total_steps": 1080, "loss": 0.1189, "lr": 3.0126637479122193e-05, "epoch": 8.53211009174312, "percentage": 43.43, "elapsed_time": "2:15:50", "remaining_time": "2:56:58", "throughput": 2362.92, "total_tokens": 19258632} {"current_steps": 470, "total_steps": 1080, "loss": 0.0683, "lr": 3.0055439308300952e-05, "epoch": 8.55045871559633, "percentage": 43.52, "elapsed_time": "2:16:05", "remaining_time": "2:56:37", "throughput": 2363.26, "total_tokens": 19296928} {"current_steps": 471, "total_steps": 1080, "loss": 0.0766, "lr": 2.9984198360429932e-05, "epoch": 8.568807339449542, "percentage": 43.61, "elapsed_time": "2:16:23", "remaining_time": "2:56:21", "throughput": 2363.05, "total_tokens": 19338416} {"current_steps": 472, "total_steps": 1080, "loss": 0.1101, "lr": 2.9912915238320754e-05, "epoch": 8.587155963302752, "percentage": 43.7, "elapsed_time": "2:16:46", "remaining_time": "2:56:11", "throughput": 2363.02, "total_tokens": 19392040} {"current_steps": 473, "total_steps": 1080, "loss": 0.0811, "lr": 2.9841590545141906e-05, "epoch": 8.605504587155963, "percentage": 43.8, "elapsed_time": "2:17:02", "remaining_time": "2:55:52", "throughput": 2363.05, "total_tokens": 19430360} {"current_steps": 474, "total_steps": 1080, "loss": 0.0665, "lr": 2.9770224884413623e-05, "epoch": 8.623853211009175, "percentage": 43.89, "elapsed_time": "2:17:27", "remaining_time": "2:55:44", "throughput": 2362.76, "total_tokens": 19487640} {"current_steps": 475, "total_steps": 1080, "loss": 0.0856, "lr": 2.9698818860002797e-05, "epoch": 8.642201834862385, "percentage": 43.98, "elapsed_time": "2:17:41", "remaining_time": "2:55:22", "throughput": 2362.88, "total_tokens": 19520352} {"current_steps": 476, "total_steps": 1080, "loss": 0.0709, "lr": 2.9627373076117863e-05, "epoch": 8.660550458715596, "percentage": 44.07, "elapsed_time": "2:18:03", "remaining_time": "2:55:10", "throughput": 2362.69, "total_tokens": 19570472} {"current_steps": 477, "total_steps": 1080, "loss": 0.0774, "lr": 2.9555888137303695e-05, "epoch": 8.678899082568808, "percentage": 44.17, "elapsed_time": "2:18:15", "remaining_time": "2:54:46", "throughput": 2362.88, "total_tokens": 19600648} {"current_steps": 478, "total_steps": 1080, "loss": 0.0758, "lr": 2.9484364648436437e-05, "epoch": 8.697247706422019, "percentage": 44.26, "elapsed_time": "2:18:34", "remaining_time": "2:54:31", "throughput": 2363.13, "total_tokens": 19649200} {"current_steps": 479, "total_steps": 1080, "loss": 0.0833, "lr": 2.941280321471848e-05, "epoch": 8.715596330275229, "percentage": 44.35, "elapsed_time": "2:18:47", "remaining_time": "2:54:09", "throughput": 2363.18, "total_tokens": 19680328} {"current_steps": 480, "total_steps": 1080, "loss": 0.0763, "lr": 2.9341204441673266e-05, "epoch": 8.73394495412844, "percentage": 44.44, "elapsed_time": "2:19:06", "remaining_time": "2:53:53", "throughput": 2363.63, "total_tokens": 19728296} {"current_steps": 481, "total_steps": 1080, "loss": 0.1141, "lr": 2.9269568935140174e-05, "epoch": 8.752293577981652, "percentage": 44.54, "elapsed_time": "2:19:21", "remaining_time": "2:53:32", "throughput": 2363.87, "total_tokens": 19764920} {"current_steps": 482, "total_steps": 1080, "loss": 0.137, "lr": 2.9197897301269435e-05, "epoch": 8.770642201834862, "percentage": 44.63, "elapsed_time": "2:19:38", "remaining_time": "2:53:15", "throughput": 2363.92, "total_tokens": 19806568} {"current_steps": 483, "total_steps": 1080, "loss": 0.059, "lr": 2.9126190146516942e-05, "epoch": 8.788990825688073, "percentage": 44.72, "elapsed_time": "2:19:56", "remaining_time": "2:52:58", "throughput": 2364.15, "total_tokens": 19851352} {"current_steps": 484, "total_steps": 1080, "loss": 0.0993, "lr": 2.905444807763919e-05, "epoch": 8.807339449541285, "percentage": 44.81, "elapsed_time": "2:20:15", "remaining_time": "2:52:42", "throughput": 2364.52, "total_tokens": 19897640} {"current_steps": 485, "total_steps": 1080, "loss": 0.0721, "lr": 2.898267170168807e-05, "epoch": 8.825688073394495, "percentage": 44.91, "elapsed_time": "2:20:30", "remaining_time": "2:52:22", "throughput": 2364.86, "total_tokens": 19936472} {"current_steps": 486, "total_steps": 1080, "loss": 0.0875, "lr": 2.8910861626005776e-05, "epoch": 8.844036697247706, "percentage": 45.0, "elapsed_time": "2:20:43", "remaining_time": "2:52:00", "throughput": 2364.75, "total_tokens": 19967128} {"current_steps": 487, "total_steps": 1080, "loss": 0.0784, "lr": 2.8839018458219653e-05, "epoch": 8.862385321100918, "percentage": 45.09, "elapsed_time": "2:21:03", "remaining_time": "2:51:45", "throughput": 2364.25, "total_tokens": 20010472} {"current_steps": 488, "total_steps": 1080, "loss": 0.0949, "lr": 2.876714280623708e-05, "epoch": 8.880733944954128, "percentage": 45.19, "elapsed_time": "2:21:24", "remaining_time": "2:51:32", "throughput": 2364.06, "total_tokens": 20056984} {"current_steps": 489, "total_steps": 1080, "loss": 0.0718, "lr": 2.8695235278240272e-05, "epoch": 8.899082568807339, "percentage": 45.28, "elapsed_time": "2:21:44", "remaining_time": "2:51:18", "throughput": 2364.14, "total_tokens": 20105712} {"current_steps": 490, "total_steps": 1080, "loss": 0.0904, "lr": 2.8623296482681166e-05, "epoch": 8.917431192660551, "percentage": 45.37, "elapsed_time": "2:22:00", "remaining_time": "2:50:58", "throughput": 2364.65, "total_tokens": 20147136} {"current_steps": 491, "total_steps": 1080, "loss": 0.0652, "lr": 2.8551327028276314e-05, "epoch": 8.935779816513762, "percentage": 45.46, "elapsed_time": "2:22:17", "remaining_time": "2:50:41", "throughput": 2364.98, "total_tokens": 20190008} {"current_steps": 492, "total_steps": 1080, "loss": 0.1347, "lr": 2.8479327524001636e-05, "epoch": 8.954128440366972, "percentage": 45.56, "elapsed_time": "2:22:35", "remaining_time": "2:50:25", "throughput": 2365.11, "total_tokens": 20235552} {"current_steps": 493, "total_steps": 1080, "loss": 0.0642, "lr": 2.8407298579087365e-05, "epoch": 8.972477064220184, "percentage": 45.65, "elapsed_time": "2:22:55", "remaining_time": "2:50:11", "throughput": 2364.59, "total_tokens": 20278504} {"current_steps": 494, "total_steps": 1080, "loss": 0.0689, "lr": 2.833524080301282e-05, "epoch": 8.990825688073395, "percentage": 45.74, "elapsed_time": "2:23:11", "remaining_time": "2:49:51", "throughput": 2364.38, "total_tokens": 20314024} {"current_steps": 495, "total_steps": 1080, "loss": 0.0735, "lr": 2.8263154805501297e-05, "epoch": 9.0, "percentage": 45.83, "elapsed_time": "2:23:19", "remaining_time": "2:49:22", "throughput": 2364.38, "total_tokens": 20331792} {"current_steps": 496, "total_steps": 1080, "loss": 0.0695, "lr": 2.8191041196514873e-05, "epoch": 9.01834862385321, "percentage": 45.93, "elapsed_time": "2:23:31", "remaining_time": "2:48:58", "throughput": 2364.34, "total_tokens": 20359504} {"current_steps": 497, "total_steps": 1080, "loss": 0.1075, "lr": 2.8118900586249263e-05, "epoch": 9.036697247706423, "percentage": 46.02, "elapsed_time": "2:23:45", "remaining_time": "2:48:38", "throughput": 2364.32, "total_tokens": 20393544} {"current_steps": 498, "total_steps": 1080, "loss": 0.0658, "lr": 2.8046733585128687e-05, "epoch": 9.055045871559633, "percentage": 46.11, "elapsed_time": "2:23:56", "remaining_time": "2:48:13", "throughput": 2364.38, "total_tokens": 20419560} {"current_steps": 499, "total_steps": 1080, "loss": 0.0581, "lr": 2.7974540803800637e-05, "epoch": 9.073394495412844, "percentage": 46.2, "elapsed_time": "2:24:14", "remaining_time": "2:47:56", "throughput": 2364.54, "total_tokens": 20462936} {"current_steps": 500, "total_steps": 1080, "loss": 0.0845, "lr": 2.7902322853130757e-05, "epoch": 9.091743119266056, "percentage": 46.3, "elapsed_time": "2:24:26", "remaining_time": "2:47:32", "throughput": 2364.83, "total_tokens": 20494032} {"current_steps": 501, "total_steps": 1080, "loss": 0.0543, "lr": 2.7830080344197674e-05, "epoch": 9.110091743119266, "percentage": 46.39, "elapsed_time": "2:24:54", "remaining_time": "2:47:27", "throughput": 2363.96, "total_tokens": 20553072} {"current_steps": 502, "total_steps": 1080, "loss": 0.2288, "lr": 2.7757813888287798e-05, "epoch": 9.128440366972477, "percentage": 46.48, "elapsed_time": "2:25:15", "remaining_time": "2:47:14", "throughput": 2364.33, "total_tokens": 20605784} {"current_steps": 503, "total_steps": 1080, "loss": 0.0636, "lr": 2.7685524096890185e-05, "epoch": 9.146788990825687, "percentage": 46.57, "elapsed_time": "2:25:34", "remaining_time": "2:46:59", "throughput": 2364.51, "total_tokens": 20651856} {"current_steps": 504, "total_steps": 1080, "loss": 0.0524, "lr": 2.761321158169134e-05, "epoch": 9.1651376146789, "percentage": 46.67, "elapsed_time": "2:25:52", "remaining_time": "2:46:42", "throughput": 2364.77, "total_tokens": 20696944} {"current_steps": 505, "total_steps": 1080, "loss": 0.0652, "lr": 2.7540876954570048e-05, "epoch": 9.18348623853211, "percentage": 46.76, "elapsed_time": "2:26:04", "remaining_time": "2:46:19", "throughput": 2365.05, "total_tokens": 20728072} {"current_steps": 506, "total_steps": 1080, "loss": 0.05, "lr": 2.7468520827592197e-05, "epoch": 9.20183486238532, "percentage": 46.85, "elapsed_time": "2:26:20", "remaining_time": "2:46:00", "throughput": 2364.98, "total_tokens": 20765264} {"current_steps": 507, "total_steps": 1080, "loss": 0.0763, "lr": 2.7396143813005602e-05, "epoch": 9.220183486238533, "percentage": 46.94, "elapsed_time": "2:26:36", "remaining_time": "2:45:41", "throughput": 2364.88, "total_tokens": 20803144} {"current_steps": 508, "total_steps": 1080, "loss": 0.0495, "lr": 2.732374652323481e-05, "epoch": 9.238532110091743, "percentage": 47.04, "elapsed_time": "2:26:57", "remaining_time": "2:45:28", "throughput": 2365.47, "total_tokens": 20857912} {"current_steps": 509, "total_steps": 1080, "loss": 0.0518, "lr": 2.7251329570875934e-05, "epoch": 9.256880733944953, "percentage": 47.13, "elapsed_time": "2:27:16", "remaining_time": "2:45:13", "throughput": 2365.31, "total_tokens": 20901536} {"current_steps": 510, "total_steps": 1080, "loss": 0.0605, "lr": 2.717889356869146e-05, "epoch": 9.275229357798166, "percentage": 47.22, "elapsed_time": "2:27:35", "remaining_time": "2:44:56", "throughput": 2365.27, "total_tokens": 20944592} {"current_steps": 511, "total_steps": 1080, "loss": 0.056, "lr": 2.7106439129605072e-05, "epoch": 9.293577981651376, "percentage": 47.31, "elapsed_time": "2:27:49", "remaining_time": "2:44:35", "throughput": 2365.7, "total_tokens": 20981640} {"current_steps": 512, "total_steps": 1080, "loss": 0.0661, "lr": 2.7033966866696457e-05, "epoch": 9.311926605504587, "percentage": 47.41, "elapsed_time": "2:28:02", "remaining_time": "2:44:13", "throughput": 2365.6, "total_tokens": 21011280} {"current_steps": 513, "total_steps": 1080, "loss": 0.0735, "lr": 2.6961477393196126e-05, "epoch": 9.330275229357799, "percentage": 47.5, "elapsed_time": "2:28:20", "remaining_time": "2:43:57", "throughput": 2365.7, "total_tokens": 21056896} {"current_steps": 514, "total_steps": 1080, "loss": 0.0541, "lr": 2.6888971322480205e-05, "epoch": 9.34862385321101, "percentage": 47.59, "elapsed_time": "2:28:36", "remaining_time": "2:43:38", "throughput": 2366.0, "total_tokens": 21096440} {"current_steps": 515, "total_steps": 1080, "loss": 0.1135, "lr": 2.681644926806527e-05, "epoch": 9.36697247706422, "percentage": 47.69, "elapsed_time": "2:28:54", "remaining_time": "2:43:21", "throughput": 2365.76, "total_tokens": 21136776} {"current_steps": 516, "total_steps": 1080, "loss": 0.0572, "lr": 2.674391184360313e-05, "epoch": 9.385321100917432, "percentage": 47.78, "elapsed_time": "2:29:10", "remaining_time": "2:43:03", "throughput": 2365.97, "total_tokens": 21177016} {"current_steps": 517, "total_steps": 1080, "loss": 0.0465, "lr": 2.6671359662875684e-05, "epoch": 9.403669724770642, "percentage": 47.87, "elapsed_time": "2:29:26", "remaining_time": "2:42:44", "throughput": 2366.21, "total_tokens": 21216216} {"current_steps": 518, "total_steps": 1080, "loss": 0.0596, "lr": 2.659879333978964e-05, "epoch": 9.422018348623853, "percentage": 47.96, "elapsed_time": "2:29:52", "remaining_time": "2:42:36", "throughput": 2366.17, "total_tokens": 21278344} {"current_steps": 519, "total_steps": 1080, "loss": 0.1131, "lr": 2.6526213488371427e-05, "epoch": 9.440366972477065, "percentage": 48.06, "elapsed_time": "2:30:15", "remaining_time": "2:42:24", "throughput": 2366.04, "total_tokens": 21330704} {"current_steps": 520, "total_steps": 1080, "loss": 0.0587, "lr": 2.6453620722761896e-05, "epoch": 9.458715596330276, "percentage": 48.15, "elapsed_time": "2:30:35", "remaining_time": "2:42:10", "throughput": 2365.98, "total_tokens": 21377568} {"current_steps": 521, "total_steps": 1080, "loss": 0.0529, "lr": 2.6381015657211215e-05, "epoch": 9.477064220183486, "percentage": 48.24, "elapsed_time": "2:30:54", "remaining_time": "2:41:54", "throughput": 2365.9, "total_tokens": 21421808} {"current_steps": 522, "total_steps": 1080, "loss": 0.0592, "lr": 2.63083989060736e-05, "epoch": 9.495412844036696, "percentage": 48.33, "elapsed_time": "2:31:13", "remaining_time": "2:41:39", "throughput": 2365.71, "total_tokens": 21465904} {"current_steps": 523, "total_steps": 1080, "loss": 0.0952, "lr": 2.623577108380215e-05, "epoch": 9.513761467889909, "percentage": 48.43, "elapsed_time": "2:31:31", "remaining_time": "2:41:22", "throughput": 2365.65, "total_tokens": 21507888} {"current_steps": 524, "total_steps": 1080, "loss": 0.0649, "lr": 2.6163132804943675e-05, "epoch": 9.53211009174312, "percentage": 48.52, "elapsed_time": "2:31:46", "remaining_time": "2:41:02", "throughput": 2365.52, "total_tokens": 21541544} {"current_steps": 525, "total_steps": 1080, "loss": 0.0557, "lr": 2.6090484684133404e-05, "epoch": 9.55045871559633, "percentage": 48.61, "elapsed_time": "2:31:59", "remaining_time": "2:40:40", "throughput": 2365.92, "total_tokens": 21576072} {"current_steps": 526, "total_steps": 1080, "loss": 0.1018, "lr": 2.60178273360899e-05, "epoch": 9.568807339449542, "percentage": 48.7, "elapsed_time": "2:32:20", "remaining_time": "2:40:27", "throughput": 2365.55, "total_tokens": 21623464} {"current_steps": 527, "total_steps": 1080, "loss": 0.0629, "lr": 2.5945161375609778e-05, "epoch": 9.587155963302752, "percentage": 48.8, "elapsed_time": "2:32:35", "remaining_time": "2:40:07", "throughput": 2365.31, "total_tokens": 21656096} {"current_steps": 528, "total_steps": 1080, "loss": 0.0725, "lr": 2.587248741756253e-05, "epoch": 9.605504587155963, "percentage": 48.89, "elapsed_time": "2:32:48", "remaining_time": "2:39:45", "throughput": 2365.18, "total_tokens": 21685872} {"current_steps": 529, "total_steps": 1080, "loss": 0.0605, "lr": 2.5799806076885326e-05, "epoch": 9.623853211009175, "percentage": 48.98, "elapsed_time": "2:33:14", "remaining_time": "2:39:36", "throughput": 2364.51, "total_tokens": 21740704} {"current_steps": 530, "total_steps": 1080, "loss": 0.0821, "lr": 2.5727117968577784e-05, "epoch": 9.642201834862385, "percentage": 49.07, "elapsed_time": "2:33:30", "remaining_time": "2:39:17", "throughput": 2364.29, "total_tokens": 21775920} {"current_steps": 531, "total_steps": 1080, "loss": 0.0622, "lr": 2.5654423707696833e-05, "epoch": 9.660550458715596, "percentage": 49.17, "elapsed_time": "2:33:51", "remaining_time": "2:39:04", "throughput": 2363.84, "total_tokens": 21822360} {"current_steps": 532, "total_steps": 1080, "loss": 0.066, "lr": 2.5581723909351406e-05, "epoch": 9.678899082568808, "percentage": 49.26, "elapsed_time": "2:34:10", "remaining_time": "2:38:49", "throughput": 2364.33, "total_tokens": 21872168} {"current_steps": 533, "total_steps": 1080, "loss": 0.0555, "lr": 2.5509019188697343e-05, "epoch": 9.697247706422019, "percentage": 49.35, "elapsed_time": "2:34:28", "remaining_time": "2:38:31", "throughput": 2364.42, "total_tokens": 21914080} {"current_steps": 534, "total_steps": 1080, "loss": 0.0605, "lr": 2.5436310160932092e-05, "epoch": 9.715596330275229, "percentage": 49.44, "elapsed_time": "2:34:47", "remaining_time": "2:38:16", "throughput": 2364.39, "total_tokens": 21959648} {"current_steps": 535, "total_steps": 1080, "loss": 0.0622, "lr": 2.536359744128957e-05, "epoch": 9.73394495412844, "percentage": 49.54, "elapsed_time": "2:35:04", "remaining_time": "2:37:58", "throughput": 2364.38, "total_tokens": 22000280} {"current_steps": 536, "total_steps": 1080, "loss": 0.1505, "lr": 2.5290881645034932e-05, "epoch": 9.752293577981652, "percentage": 49.63, "elapsed_time": "2:35:30", "remaining_time": "2:37:50", "throughput": 2364.08, "total_tokens": 22058744} {"current_steps": 537, "total_steps": 1080, "loss": 0.0939, "lr": 2.521816338745935e-05, "epoch": 9.770642201834862, "percentage": 49.72, "elapsed_time": "2:35:49", "remaining_time": "2:37:34", "throughput": 2364.03, "total_tokens": 22102616} {"current_steps": 538, "total_steps": 1080, "loss": 0.0507, "lr": 2.5145443283874848e-05, "epoch": 9.788990825688073, "percentage": 49.81, "elapsed_time": "2:36:05", "remaining_time": "2:37:15", "throughput": 2364.06, "total_tokens": 22141096} {"current_steps": 539, "total_steps": 1080, "loss": 0.0659, "lr": 2.5072721949609053e-05, "epoch": 9.807339449541285, "percentage": 49.91, "elapsed_time": "2:36:22", "remaining_time": "2:36:57", "throughput": 2363.98, "total_tokens": 22179672} {"current_steps": 540, "total_steps": 1080, "loss": 0.0683, "lr": 2.5e-05, "epoch": 9.825688073394495, "percentage": 50.0, "elapsed_time": "2:36:36", "remaining_time": "2:36:36", "throughput": 2364.15, "total_tokens": 22214744} {"current_steps": 541, "total_steps": 1080, "loss": 0.0633, "lr": 2.4927278050390956e-05, "epoch": 9.844036697247706, "percentage": 50.09, "elapsed_time": "2:36:55", "remaining_time": "2:36:21", "throughput": 2363.73, "total_tokens": 22256776} {"current_steps": 542, "total_steps": 1080, "loss": 0.1099, "lr": 2.485455671612515e-05, "epoch": 9.862385321100918, "percentage": 50.19, "elapsed_time": "2:37:13", "remaining_time": "2:36:04", "throughput": 2363.83, "total_tokens": 22300168} {"current_steps": 543, "total_steps": 1080, "loss": 0.0571, "lr": 2.4781836612540657e-05, "epoch": 9.880733944954128, "percentage": 50.28, "elapsed_time": "2:37:32", "remaining_time": "2:35:48", "throughput": 2363.84, "total_tokens": 22345376} {"current_steps": 544, "total_steps": 1080, "loss": 0.0552, "lr": 2.470911835496508e-05, "epoch": 9.899082568807339, "percentage": 50.37, "elapsed_time": "2:37:45", "remaining_time": "2:35:26", "throughput": 2363.74, "total_tokens": 22374072} {"current_steps": 545, "total_steps": 1080, "loss": 0.1122, "lr": 2.4636402558710432e-05, "epoch": 9.917431192660551, "percentage": 50.46, "elapsed_time": "2:38:02", "remaining_time": "2:35:08", "throughput": 2363.99, "total_tokens": 22415592} {"current_steps": 546, "total_steps": 1080, "loss": 0.0643, "lr": 2.4563689839067913e-05, "epoch": 9.935779816513762, "percentage": 50.56, "elapsed_time": "2:38:20", "remaining_time": "2:34:51", "throughput": 2363.87, "total_tokens": 22458208} {"current_steps": 547, "total_steps": 1080, "loss": 0.0535, "lr": 2.4490980811302656e-05, "epoch": 9.954128440366972, "percentage": 50.65, "elapsed_time": "2:38:36", "remaining_time": "2:34:33", "throughput": 2364.0, "total_tokens": 22497376} {"current_steps": 548, "total_steps": 1080, "loss": 0.1055, "lr": 2.4418276090648596e-05, "epoch": 9.972477064220184, "percentage": 50.74, "elapsed_time": "2:38:49", "remaining_time": "2:34:11", "throughput": 2364.56, "total_tokens": 22534016} {"current_steps": 549, "total_steps": 1080, "loss": 0.0527, "lr": 2.4345576292303176e-05, "epoch": 9.990825688073395, "percentage": 50.83, "elapsed_time": "2:39:07", "remaining_time": "2:33:54", "throughput": 2364.46, "total_tokens": 22573896} {"current_steps": 550, "total_steps": 1080, "loss": 0.0589, "lr": 2.4272882031422215e-05, "epoch": 10.0, "percentage": 50.93, "elapsed_time": "2:39:14", "remaining_time": "2:33:26", "throughput": 2364.44, "total_tokens": 22590880} {"current_steps": 551, "total_steps": 1080, "loss": 0.0605, "lr": 2.4200193923114683e-05, "epoch": 10.01834862385321, "percentage": 51.02, "elapsed_time": "2:39:30", "remaining_time": "2:33:08", "throughput": 2364.53, "total_tokens": 22629088} {"current_steps": 552, "total_steps": 1080, "loss": 0.0537, "lr": 2.4127512582437485e-05, "epoch": 10.036697247706423, "percentage": 51.11, "elapsed_time": "2:39:46", "remaining_time": "2:32:49", "throughput": 2364.54, "total_tokens": 22668208} {"current_steps": 553, "total_steps": 1080, "loss": 0.0458, "lr": 2.405483862439023e-05, "epoch": 10.055045871559633, "percentage": 51.2, "elapsed_time": "2:40:02", "remaining_time": "2:32:31", "throughput": 2364.67, "total_tokens": 22706992} {"current_steps": 554, "total_steps": 1080, "loss": 0.057, "lr": 2.3982172663910108e-05, "epoch": 10.073394495412844, "percentage": 51.3, "elapsed_time": "2:40:17", "remaining_time": "2:32:11", "throughput": 2364.48, "total_tokens": 22740280} {"current_steps": 555, "total_steps": 1080, "loss": 0.1281, "lr": 2.3909515315866605e-05, "epoch": 10.091743119266056, "percentage": 51.39, "elapsed_time": "2:40:34", "remaining_time": "2:31:53", "throughput": 2364.45, "total_tokens": 22779464} {"current_steps": 556, "total_steps": 1080, "loss": 0.0505, "lr": 2.3836867195056335e-05, "epoch": 10.110091743119266, "percentage": 51.48, "elapsed_time": "2:40:50", "remaining_time": "2:31:34", "throughput": 2364.66, "total_tokens": 22819232} {"current_steps": 557, "total_steps": 1080, "loss": 0.0533, "lr": 2.3764228916197855e-05, "epoch": 10.128440366972477, "percentage": 51.57, "elapsed_time": "2:41:06", "remaining_time": "2:31:16", "throughput": 2364.92, "total_tokens": 22860296} {"current_steps": 558, "total_steps": 1080, "loss": 0.0657, "lr": 2.3691601093926404e-05, "epoch": 10.146788990825687, "percentage": 51.67, "elapsed_time": "2:41:20", "remaining_time": "2:30:55", "throughput": 2365.13, "total_tokens": 22895040} {"current_steps": 559, "total_steps": 1080, "loss": 0.0448, "lr": 2.361898434278879e-05, "epoch": 10.1651376146789, "percentage": 51.76, "elapsed_time": "2:41:39", "remaining_time": "2:30:40", "throughput": 2365.06, "total_tokens": 22939848} {"current_steps": 560, "total_steps": 1080, "loss": 0.0511, "lr": 2.3546379277238107e-05, "epoch": 10.18348623853211, "percentage": 51.85, "elapsed_time": "2:42:00", "remaining_time": "2:30:26", "throughput": 2365.04, "total_tokens": 22990280} {"current_steps": 561, "total_steps": 1080, "loss": 0.0557, "lr": 2.3473786511628575e-05, "epoch": 10.20183486238532, "percentage": 51.94, "elapsed_time": "2:42:19", "remaining_time": "2:30:10", "throughput": 2365.11, "total_tokens": 23034808} {"current_steps": 562, "total_steps": 1080, "loss": 0.0481, "lr": 2.3401206660210363e-05, "epoch": 10.220183486238533, "percentage": 52.04, "elapsed_time": "2:42:40", "remaining_time": "2:29:56", "throughput": 2364.88, "total_tokens": 23082600} {"current_steps": 563, "total_steps": 1080, "loss": 0.0408, "lr": 2.3328640337124326e-05, "epoch": 10.238532110091743, "percentage": 52.13, "elapsed_time": "2:42:58", "remaining_time": "2:29:39", "throughput": 2364.84, "total_tokens": 23125248} {"current_steps": 564, "total_steps": 1080, "loss": 0.1393, "lr": 2.3256088156396868e-05, "epoch": 10.256880733944953, "percentage": 52.22, "elapsed_time": "2:43:17", "remaining_time": "2:29:23", "throughput": 2364.75, "total_tokens": 23169104} {"current_steps": 565, "total_steps": 1080, "loss": 0.0445, "lr": 2.3183550731934735e-05, "epoch": 10.275229357798166, "percentage": 52.31, "elapsed_time": "2:43:35", "remaining_time": "2:29:07", "throughput": 2364.84, "total_tokens": 23213000} {"current_steps": 566, "total_steps": 1080, "loss": 0.0491, "lr": 2.3111028677519804e-05, "epoch": 10.293577981651376, "percentage": 52.41, "elapsed_time": "2:43:51", "remaining_time": "2:28:48", "throughput": 2364.99, "total_tokens": 23252584} {"current_steps": 567, "total_steps": 1080, "loss": 0.0438, "lr": 2.303852260680388e-05, "epoch": 10.311926605504587, "percentage": 52.5, "elapsed_time": "2:44:09", "remaining_time": "2:28:31", "throughput": 2365.15, "total_tokens": 23294424} {"current_steps": 568, "total_steps": 1080, "loss": 0.0818, "lr": 2.2966033133303545e-05, "epoch": 10.330275229357799, "percentage": 52.59, "elapsed_time": "2:44:24", "remaining_time": "2:28:12", "throughput": 2365.2, "total_tokens": 23331696} {"current_steps": 569, "total_steps": 1080, "loss": 0.0733, "lr": 2.289356087039493e-05, "epoch": 10.34862385321101, "percentage": 52.69, "elapsed_time": "2:44:41", "remaining_time": "2:27:54", "throughput": 2364.99, "total_tokens": 23370592} {"current_steps": 570, "total_steps": 1080, "loss": 0.0576, "lr": 2.2821106431308544e-05, "epoch": 10.36697247706422, "percentage": 52.78, "elapsed_time": "2:44:58", "remaining_time": "2:27:36", "throughput": 2364.6, "total_tokens": 23406728} {"current_steps": 571, "total_steps": 1080, "loss": 0.0399, "lr": 2.274867042912408e-05, "epoch": 10.385321100917432, "percentage": 52.87, "elapsed_time": "2:45:20", "remaining_time": "2:27:23", "throughput": 2364.52, "total_tokens": 23456880} {"current_steps": 572, "total_steps": 1080, "loss": 0.1006, "lr": 2.2676253476765196e-05, "epoch": 10.403669724770642, "percentage": 52.96, "elapsed_time": "2:45:39", "remaining_time": "2:27:07", "throughput": 2364.46, "total_tokens": 23501632} {"current_steps": 573, "total_steps": 1080, "loss": 0.048, "lr": 2.26038561869944e-05, "epoch": 10.422018348623853, "percentage": 53.06, "elapsed_time": "2:45:59", "remaining_time": "2:26:52", "throughput": 2364.23, "total_tokens": 23546696} {"current_steps": 574, "total_steps": 1080, "loss": 0.038, "lr": 2.2531479172407805e-05, "epoch": 10.440366972477065, "percentage": 53.15, "elapsed_time": "2:46:16", "remaining_time": "2:26:34", "throughput": 2364.76, "total_tokens": 23590976} {"current_steps": 575, "total_steps": 1080, "loss": 0.0475, "lr": 2.2459123045429954e-05, "epoch": 10.458715596330276, "percentage": 53.24, "elapsed_time": "2:46:33", "remaining_time": "2:26:17", "throughput": 2364.64, "total_tokens": 23632096} {"current_steps": 576, "total_steps": 1080, "loss": 0.0385, "lr": 2.238678841830867e-05, "epoch": 10.477064220183486, "percentage": 53.33, "elapsed_time": "2:46:46", "remaining_time": "2:25:55", "throughput": 2364.69, "total_tokens": 23661968} {"current_steps": 577, "total_steps": 1080, "loss": 0.0602, "lr": 2.2314475903109825e-05, "epoch": 10.495412844036696, "percentage": 53.43, "elapsed_time": "2:47:07", "remaining_time": "2:25:41", "throughput": 2364.43, "total_tokens": 23709568} {"current_steps": 578, "total_steps": 1080, "loss": 0.0812, "lr": 2.2242186111712208e-05, "epoch": 10.513761467889909, "percentage": 53.52, "elapsed_time": "2:47:27", "remaining_time": "2:25:26", "throughput": 2363.79, "total_tokens": 23749216} {"current_steps": 579, "total_steps": 1080, "loss": 0.1103, "lr": 2.2169919655802335e-05, "epoch": 10.53211009174312, "percentage": 53.61, "elapsed_time": "2:47:42", "remaining_time": "2:25:07", "throughput": 2363.81, "total_tokens": 23786848} {"current_steps": 580, "total_steps": 1080, "loss": 0.048, "lr": 2.2097677146869242e-05, "epoch": 10.55045871559633, "percentage": 53.7, "elapsed_time": "2:47:59", "remaining_time": "2:24:48", "throughput": 2364.02, "total_tokens": 23827336} {"current_steps": 581, "total_steps": 1080, "loss": 0.1118, "lr": 2.202545919619937e-05, "epoch": 10.568807339449542, "percentage": 53.8, "elapsed_time": "2:48:22", "remaining_time": "2:24:36", "throughput": 2363.72, "total_tokens": 23880272} {"current_steps": 582, "total_steps": 1080, "loss": 0.0512, "lr": 2.195326641487132e-05, "epoch": 10.587155963302752, "percentage": 53.89, "elapsed_time": "2:48:40", "remaining_time": "2:24:19", "throughput": 2363.86, "total_tokens": 23923208} {"current_steps": 583, "total_steps": 1080, "loss": 0.0809, "lr": 2.1881099413750733e-05, "epoch": 10.605504587155963, "percentage": 53.98, "elapsed_time": "2:48:55", "remaining_time": "2:24:00", "throughput": 2364.21, "total_tokens": 23961424} {"current_steps": 584, "total_steps": 1080, "loss": 0.0446, "lr": 2.1808958803485136e-05, "epoch": 10.623853211009175, "percentage": 54.07, "elapsed_time": "2:49:10", "remaining_time": "2:23:40", "throughput": 2364.46, "total_tokens": 24000184} {"current_steps": 585, "total_steps": 1080, "loss": 0.0472, "lr": 2.173684519449872e-05, "epoch": 10.642201834862385, "percentage": 54.17, "elapsed_time": "2:49:29", "remaining_time": "2:23:24", "throughput": 2364.86, "total_tokens": 24049488} {"current_steps": 586, "total_steps": 1080, "loss": 0.0522, "lr": 2.1664759196987182e-05, "epoch": 10.660550458715596, "percentage": 54.26, "elapsed_time": "2:49:43", "remaining_time": "2:23:04", "throughput": 2365.16, "total_tokens": 24085104} {"current_steps": 587, "total_steps": 1080, "loss": 0.1182, "lr": 2.1592701420912644e-05, "epoch": 10.678899082568808, "percentage": 54.35, "elapsed_time": "2:50:02", "remaining_time": "2:22:48", "throughput": 2364.66, "total_tokens": 24124768} {"current_steps": 588, "total_steps": 1080, "loss": 0.0452, "lr": 2.1520672475998373e-05, "epoch": 10.697247706422019, "percentage": 54.44, "elapsed_time": "2:50:21", "remaining_time": "2:22:32", "throughput": 2364.49, "total_tokens": 24167872} {"current_steps": 589, "total_steps": 1080, "loss": 0.0586, "lr": 2.144867297172369e-05, "epoch": 10.715596330275229, "percentage": 54.54, "elapsed_time": "2:50:33", "remaining_time": "2:22:10", "throughput": 2364.69, "total_tokens": 24198824} {"current_steps": 590, "total_steps": 1080, "loss": 0.0547, "lr": 2.1376703517318837e-05, "epoch": 10.73394495412844, "percentage": 54.63, "elapsed_time": "2:50:51", "remaining_time": "2:21:53", "throughput": 2365.46, "total_tokens": 24249320} {"current_steps": 591, "total_steps": 1080, "loss": 0.0562, "lr": 2.1304764721759733e-05, "epoch": 10.752293577981652, "percentage": 54.72, "elapsed_time": "2:51:08", "remaining_time": "2:21:36", "throughput": 2365.7, "total_tokens": 24292592} {"current_steps": 592, "total_steps": 1080, "loss": 0.056, "lr": 2.1232857193762924e-05, "epoch": 10.770642201834862, "percentage": 54.81, "elapsed_time": "2:51:25", "remaining_time": "2:21:18", "throughput": 2365.61, "total_tokens": 24331648} {"current_steps": 593, "total_steps": 1080, "loss": 0.0538, "lr": 2.116098154178035e-05, "epoch": 10.788990825688073, "percentage": 54.91, "elapsed_time": "2:51:51", "remaining_time": "2:21:08", "throughput": 2364.96, "total_tokens": 24386904} {"current_steps": 594, "total_steps": 1080, "loss": 0.0924, "lr": 2.1089138373994223e-05, "epoch": 10.807339449541285, "percentage": 55.0, "elapsed_time": "2:52:11", "remaining_time": "2:20:53", "throughput": 2365.05, "total_tokens": 24435360} {"current_steps": 595, "total_steps": 1080, "loss": 0.0468, "lr": 2.101732829831194e-05, "epoch": 10.825688073394495, "percentage": 55.09, "elapsed_time": "2:52:25", "remaining_time": "2:20:32", "throughput": 2364.9, "total_tokens": 24465400} {"current_steps": 596, "total_steps": 1080, "loss": 0.057, "lr": 2.0945551922360818e-05, "epoch": 10.844036697247706, "percentage": 55.19, "elapsed_time": "2:52:38", "remaining_time": "2:20:11", "throughput": 2365.09, "total_tokens": 24497984} {"current_steps": 597, "total_steps": 1080, "loss": 0.0472, "lr": 2.087380985348306e-05, "epoch": 10.862385321100918, "percentage": 55.28, "elapsed_time": "2:52:53", "remaining_time": "2:19:52", "throughput": 2365.23, "total_tokens": 24534576} {"current_steps": 598, "total_steps": 1080, "loss": 0.0592, "lr": 2.0802102698730574e-05, "epoch": 10.880733944954128, "percentage": 55.37, "elapsed_time": "2:53:07", "remaining_time": "2:19:32", "throughput": 2365.48, "total_tokens": 24572160} {"current_steps": 599, "total_steps": 1080, "loss": 0.0392, "lr": 2.0730431064859836e-05, "epoch": 10.899082568807339, "percentage": 55.46, "elapsed_time": "2:53:29", "remaining_time": "2:19:18", "throughput": 2365.11, "total_tokens": 24619744} {"current_steps": 600, "total_steps": 1080, "loss": 0.048, "lr": 2.0658795558326743e-05, "epoch": 10.917431192660551, "percentage": 55.56, "elapsed_time": "2:53:51", "remaining_time": "2:19:05", "throughput": 2364.98, "total_tokens": 24671048} {"current_steps": 601, "total_steps": 1080, "loss": 0.0512, "lr": 2.0587196785281525e-05, "epoch": 10.935779816513762, "percentage": 55.65, "elapsed_time": "2:54:08", "remaining_time": "2:18:47", "throughput": 2365.03, "total_tokens": 24710152} {"current_steps": 602, "total_steps": 1080, "loss": 0.0466, "lr": 2.0515635351563565e-05, "epoch": 10.954128440366972, "percentage": 55.74, "elapsed_time": "2:54:23", "remaining_time": "2:18:28", "throughput": 2364.82, "total_tokens": 24744584} {"current_steps": 603, "total_steps": 1080, "loss": 0.0911, "lr": 2.0444111862696314e-05, "epoch": 10.972477064220184, "percentage": 55.83, "elapsed_time": "2:54:42", "remaining_time": "2:18:12", "throughput": 2364.75, "total_tokens": 24788584} {"current_steps": 604, "total_steps": 1080, "loss": 0.0516, "lr": 2.037262692388214e-05, "epoch": 10.990825688073395, "percentage": 55.93, "elapsed_time": "2:54:55", "remaining_time": "2:17:51", "throughput": 2365.09, "total_tokens": 24823152} {"current_steps": 605, "total_steps": 1080, "loss": 0.1007, "lr": 2.0301181139997205e-05, "epoch": 11.0, "percentage": 56.02, "elapsed_time": "2:55:07", "remaining_time": "2:17:29", "throughput": 2364.98, "total_tokens": 24849968} {"current_steps": 606, "total_steps": 1080, "loss": 0.0425, "lr": 2.022977511558638e-05, "epoch": 11.01834862385321, "percentage": 56.11, "elapsed_time": "2:55:26", "remaining_time": "2:17:13", "throughput": 2364.75, "total_tokens": 24892784} {"current_steps": 607, "total_steps": 1080, "loss": 0.0887, "lr": 2.0158409454858103e-05, "epoch": 11.036697247706423, "percentage": 56.2, "elapsed_time": "2:55:45", "remaining_time": "2:16:57", "throughput": 2364.65, "total_tokens": 24937192} {"current_steps": 608, "total_steps": 1080, "loss": 0.0425, "lr": 2.0087084761679245e-05, "epoch": 11.055045871559633, "percentage": 56.3, "elapsed_time": "2:56:02", "remaining_time": "2:16:40", "throughput": 2364.96, "total_tokens": 24980608} {"current_steps": 609, "total_steps": 1080, "loss": 0.0788, "lr": 2.0015801639570074e-05, "epoch": 11.073394495412844, "percentage": 56.39, "elapsed_time": "2:56:22", "remaining_time": "2:16:24", "throughput": 2365.21, "total_tokens": 25029016} {"current_steps": 610, "total_steps": 1080, "loss": 0.0387, "lr": 1.9944560691699057e-05, "epoch": 11.091743119266056, "percentage": 56.48, "elapsed_time": "2:56:42", "remaining_time": "2:16:08", "throughput": 2364.76, "total_tokens": 25071880} {"current_steps": 611, "total_steps": 1080, "loss": 0.0534, "lr": 1.9873362520877813e-05, "epoch": 11.110091743119266, "percentage": 56.57, "elapsed_time": "2:57:02", "remaining_time": "2:15:53", "throughput": 2364.6, "total_tokens": 25117112} {"current_steps": 612, "total_steps": 1080, "loss": 0.0509, "lr": 1.980220772955602e-05, "epoch": 11.128440366972477, "percentage": 56.67, "elapsed_time": "2:57:17", "remaining_time": "2:15:34", "throughput": 2364.7, "total_tokens": 25154456} {"current_steps": 613, "total_steps": 1080, "loss": 0.0436, "lr": 1.973109691981627e-05, "epoch": 11.146788990825687, "percentage": 56.76, "elapsed_time": "2:57:34", "remaining_time": "2:15:16", "throughput": 2364.66, "total_tokens": 25193264} {"current_steps": 614, "total_steps": 1080, "loss": 0.04, "lr": 1.9660030693369004e-05, "epoch": 11.1651376146789, "percentage": 56.85, "elapsed_time": "2:57:49", "remaining_time": "2:14:57", "throughput": 2364.78, "total_tokens": 25231416} {"current_steps": 615, "total_steps": 1080, "loss": 0.0371, "lr": 1.958900965154743e-05, "epoch": 11.18348623853211, "percentage": 56.94, "elapsed_time": "2:58:05", "remaining_time": "2:14:39", "throughput": 2364.63, "total_tokens": 25268136} {"current_steps": 616, "total_steps": 1080, "loss": 0.0986, "lr": 1.9518034395302414e-05, "epoch": 11.20183486238532, "percentage": 57.04, "elapsed_time": "2:58:26", "remaining_time": "2:14:24", "throughput": 2364.68, "total_tokens": 25316600} {"current_steps": 617, "total_steps": 1080, "loss": 0.0391, "lr": 1.9447105525197425e-05, "epoch": 11.220183486238533, "percentage": 57.13, "elapsed_time": "2:58:44", "remaining_time": "2:14:07", "throughput": 2364.49, "total_tokens": 25358424} {"current_steps": 618, "total_steps": 1080, "loss": 0.0378, "lr": 1.937622364140338e-05, "epoch": 11.238532110091743, "percentage": 57.22, "elapsed_time": "2:59:04", "remaining_time": "2:13:52", "throughput": 2364.35, "total_tokens": 25403744} {"current_steps": 619, "total_steps": 1080, "loss": 0.0412, "lr": 1.9305389343693664e-05, "epoch": 11.256880733944953, "percentage": 57.31, "elapsed_time": "2:59:18", "remaining_time": "2:13:32", "throughput": 2364.28, "total_tokens": 25436496} {"current_steps": 620, "total_steps": 1080, "loss": 0.0473, "lr": 1.9234603231438995e-05, "epoch": 11.275229357798166, "percentage": 57.41, "elapsed_time": "2:59:34", "remaining_time": "2:13:14", "throughput": 2364.45, "total_tokens": 25476544} {"current_steps": 621, "total_steps": 1080, "loss": 0.0874, "lr": 1.9163865903602374e-05, "epoch": 11.293577981651376, "percentage": 57.5, "elapsed_time": "2:59:53", "remaining_time": "2:12:58", "throughput": 2363.83, "total_tokens": 25514768} {"current_steps": 622, "total_steps": 1080, "loss": 0.0377, "lr": 1.9093177958733966e-05, "epoch": 11.311926605504587, "percentage": 57.59, "elapsed_time": "3:00:14", "remaining_time": "2:12:42", "throughput": 2363.77, "total_tokens": 25562136} {"current_steps": 623, "total_steps": 1080, "loss": 0.0338, "lr": 1.9022539994966147e-05, "epoch": 11.330275229357799, "percentage": 57.69, "elapsed_time": "3:00:28", "remaining_time": "2:12:23", "throughput": 2364.05, "total_tokens": 25599784} {"current_steps": 624, "total_steps": 1080, "loss": 0.0368, "lr": 1.895195261000831e-05, "epoch": 11.34862385321101, "percentage": 57.78, "elapsed_time": "3:00:42", "remaining_time": "2:12:03", "throughput": 2364.29, "total_tokens": 25633664} {"current_steps": 625, "total_steps": 1080, "loss": 0.0817, "lr": 1.8881416401141904e-05, "epoch": 11.36697247706422, "percentage": 57.87, "elapsed_time": "3:01:05", "remaining_time": "2:11:50", "throughput": 2364.03, "total_tokens": 25686344} {"current_steps": 626, "total_steps": 1080, "loss": 0.042, "lr": 1.8810931965215356e-05, "epoch": 11.385321100917432, "percentage": 57.96, "elapsed_time": "3:01:25", "remaining_time": "2:11:34", "throughput": 2363.88, "total_tokens": 25731184} {"current_steps": 627, "total_steps": 1080, "loss": 0.0803, "lr": 1.874049989863896e-05, "epoch": 11.403669724770642, "percentage": 58.06, "elapsed_time": "3:01:41", "remaining_time": "2:11:16", "throughput": 2364.12, "total_tokens": 25773632} {"current_steps": 628, "total_steps": 1080, "loss": 0.043, "lr": 1.8670120797379958e-05, "epoch": 11.422018348623853, "percentage": 58.15, "elapsed_time": "3:01:55", "remaining_time": "2:10:56", "throughput": 2363.99, "total_tokens": 25803376} {"current_steps": 629, "total_steps": 1080, "loss": 0.0389, "lr": 1.859979525695736e-05, "epoch": 11.440366972477065, "percentage": 58.24, "elapsed_time": "3:02:18", "remaining_time": "2:10:42", "throughput": 2363.72, "total_tokens": 25855248} {"current_steps": 630, "total_steps": 1080, "loss": 0.0429, "lr": 1.852952387243698e-05, "epoch": 11.458715596330276, "percentage": 58.33, "elapsed_time": "3:02:31", "remaining_time": "2:10:22", "throughput": 2363.79, "total_tokens": 25885840} {"current_steps": 631, "total_steps": 1080, "loss": 0.0466, "lr": 1.8459307238426416e-05, "epoch": 11.477064220183486, "percentage": 58.43, "elapsed_time": "3:02:53", "remaining_time": "2:10:08", "throughput": 2363.87, "total_tokens": 25938800} {"current_steps": 632, "total_steps": 1080, "loss": 0.0543, "lr": 1.838914594906995e-05, "epoch": 11.495412844036696, "percentage": 58.52, "elapsed_time": "3:03:08", "remaining_time": "2:09:49", "throughput": 2363.72, "total_tokens": 25973752} {"current_steps": 633, "total_steps": 1080, "loss": 0.0408, "lr": 1.831904059804358e-05, "epoch": 11.513761467889909, "percentage": 58.61, "elapsed_time": "3:03:24", "remaining_time": "2:09:30", "throughput": 2363.7, "total_tokens": 26011480} {"current_steps": 634, "total_steps": 1080, "loss": 0.0462, "lr": 1.8248991778549984e-05, "epoch": 11.53211009174312, "percentage": 58.7, "elapsed_time": "3:03:42", "remaining_time": "2:09:14", "throughput": 2363.72, "total_tokens": 26054744} {"current_steps": 635, "total_steps": 1080, "loss": 0.0478, "lr": 1.8179000083313483e-05, "epoch": 11.55045871559633, "percentage": 58.8, "elapsed_time": "3:03:54", "remaining_time": "2:08:53", "throughput": 2363.74, "total_tokens": 26083512} {"current_steps": 636, "total_steps": 1080, "loss": 0.0376, "lr": 1.8109066104575023e-05, "epoch": 11.568807339449542, "percentage": 58.89, "elapsed_time": "3:04:12", "remaining_time": "2:08:35", "throughput": 2363.92, "total_tokens": 26127504} {"current_steps": 637, "total_steps": 1080, "loss": 0.0399, "lr": 1.8039190434087212e-05, "epoch": 11.587155963302752, "percentage": 58.98, "elapsed_time": "3:04:29", "remaining_time": "2:08:18", "throughput": 2364.18, "total_tokens": 26170568} {"current_steps": 638, "total_steps": 1080, "loss": 0.0658, "lr": 1.7969373663109234e-05, "epoch": 11.605504587155963, "percentage": 59.07, "elapsed_time": "3:04:50", "remaining_time": "2:08:03", "throughput": 2364.25, "total_tokens": 26221816} {"current_steps": 639, "total_steps": 1080, "loss": 0.0384, "lr": 1.7899616382401936e-05, "epoch": 11.623853211009175, "percentage": 59.17, "elapsed_time": "3:05:06", "remaining_time": "2:07:45", "throughput": 2364.54, "total_tokens": 26262800} {"current_steps": 640, "total_steps": 1080, "loss": 0.0357, "lr": 1.7829919182222752e-05, "epoch": 11.642201834862385, "percentage": 59.26, "elapsed_time": "3:05:27", "remaining_time": "2:07:29", "throughput": 2364.61, "total_tokens": 26311200} {"current_steps": 641, "total_steps": 1080, "loss": 0.0445, "lr": 1.776028265232073e-05, "epoch": 11.660550458715596, "percentage": 59.35, "elapsed_time": "3:05:46", "remaining_time": "2:07:13", "throughput": 2364.87, "total_tokens": 26359400} {"current_steps": 642, "total_steps": 1080, "loss": 0.0352, "lr": 1.7690707381931583e-05, "epoch": 11.678899082568808, "percentage": 59.44, "elapsed_time": "3:06:02", "remaining_time": "2:06:55", "throughput": 2365.14, "total_tokens": 26401144} {"current_steps": 643, "total_steps": 1080, "loss": 0.0381, "lr": 1.7621193959772657e-05, "epoch": 11.697247706422019, "percentage": 59.54, "elapsed_time": "3:06:14", "remaining_time": "2:06:34", "throughput": 2365.07, "total_tokens": 26429056} {"current_steps": 644, "total_steps": 1080, "loss": 0.0448, "lr": 1.755174297403795e-05, "epoch": 11.715596330275229, "percentage": 59.63, "elapsed_time": "3:06:35", "remaining_time": "2:06:19", "throughput": 2365.1, "total_tokens": 26478272} {"current_steps": 645, "total_steps": 1080, "loss": 0.044, "lr": 1.7482355012393177e-05, "epoch": 11.73394495412844, "percentage": 59.72, "elapsed_time": "3:06:53", "remaining_time": "2:06:02", "throughput": 2365.53, "total_tokens": 26525592} {"current_steps": 646, "total_steps": 1080, "loss": 0.0392, "lr": 1.7413030661970742e-05, "epoch": 11.752293577981652, "percentage": 59.81, "elapsed_time": "3:07:10", "remaining_time": "2:05:45", "throughput": 2365.43, "total_tokens": 26565280} {"current_steps": 647, "total_steps": 1080, "loss": 0.0356, "lr": 1.73437705093648e-05, "epoch": 11.770642201834862, "percentage": 59.91, "elapsed_time": "3:07:27", "remaining_time": "2:05:27", "throughput": 2365.2, "total_tokens": 26601768} {"current_steps": 648, "total_steps": 1080, "loss": 0.0425, "lr": 1.7274575140626318e-05, "epoch": 11.788990825688073, "percentage": 60.0, "elapsed_time": "3:07:39", "remaining_time": "2:05:06", "throughput": 2365.48, "total_tokens": 26634496} {"current_steps": 649, "total_steps": 1080, "loss": 0.0504, "lr": 1.720544514125805e-05, "epoch": 11.807339449541285, "percentage": 60.09, "elapsed_time": "3:07:58", "remaining_time": "2:04:50", "throughput": 2365.47, "total_tokens": 26679232} {"current_steps": 650, "total_steps": 1080, "loss": 0.0566, "lr": 1.7136381096209664e-05, "epoch": 11.825688073394495, "percentage": 60.19, "elapsed_time": "3:08:17", "remaining_time": "2:04:33", "throughput": 2365.46, "total_tokens": 26723144} {"current_steps": 651, "total_steps": 1080, "loss": 0.0397, "lr": 1.7067383589872703e-05, "epoch": 11.844036697247706, "percentage": 60.28, "elapsed_time": "3:08:33", "remaining_time": "2:04:15", "throughput": 2365.39, "total_tokens": 26760448} {"current_steps": 652, "total_steps": 1080, "loss": 0.0372, "lr": 1.699845320607571e-05, "epoch": 11.862385321100918, "percentage": 60.37, "elapsed_time": "3:09:02", "remaining_time": "2:04:05", "throughput": 2364.67, "total_tokens": 26820856} {"current_steps": 653, "total_steps": 1080, "loss": 0.0932, "lr": 1.692959052807928e-05, "epoch": 11.880733944954128, "percentage": 60.46, "elapsed_time": "3:09:15", "remaining_time": "2:03:45", "throughput": 2364.63, "total_tokens": 26851736} {"current_steps": 654, "total_steps": 1080, "loss": 0.0632, "lr": 1.686079613857109e-05, "epoch": 11.899082568807339, "percentage": 60.56, "elapsed_time": "3:09:31", "remaining_time": "2:03:27", "throughput": 2364.88, "total_tokens": 26892976} {"current_steps": 655, "total_steps": 1080, "loss": 0.0806, "lr": 1.6792070619660975e-05, "epoch": 11.917431192660551, "percentage": 60.65, "elapsed_time": "3:09:49", "remaining_time": "2:03:10", "throughput": 2364.71, "total_tokens": 26933888} {"current_steps": 656, "total_steps": 1080, "loss": 0.0414, "lr": 1.672341455287605e-05, "epoch": 11.935779816513762, "percentage": 60.74, "elapsed_time": "3:10:05", "remaining_time": "2:02:52", "throughput": 2364.62, "total_tokens": 26970576} {"current_steps": 657, "total_steps": 1080, "loss": 0.0356, "lr": 1.665482851915573e-05, "epoch": 11.954128440366972, "percentage": 60.83, "elapsed_time": "3:10:20", "remaining_time": "2:02:33", "throughput": 2364.87, "total_tokens": 27008400} {"current_steps": 658, "total_steps": 1080, "loss": 0.074, "lr": 1.658631309884684e-05, "epoch": 11.972477064220184, "percentage": 60.93, "elapsed_time": "3:10:34", "remaining_time": "2:02:13", "throughput": 2365.01, "total_tokens": 27043704} {"current_steps": 659, "total_steps": 1080, "loss": 0.0473, "lr": 1.6517868871698725e-05, "epoch": 11.990825688073395, "percentage": 61.02, "elapsed_time": "3:10:51", "remaining_time": "2:01:55", "throughput": 2365.23, "total_tokens": 27084456} {"current_steps": 660, "total_steps": 1080, "loss": 0.0369, "lr": 1.6449496416858284e-05, "epoch": 12.0, "percentage": 61.11, "elapsed_time": "3:10:59", "remaining_time": "2:01:32", "throughput": 2365.58, "total_tokens": 27109056} {"current_steps": 661, "total_steps": 1080, "loss": 0.0767, "lr": 1.6381196312865145e-05, "epoch": 12.01834862385321, "percentage": 61.2, "elapsed_time": "3:11:16", "remaining_time": "2:01:14", "throughput": 2365.54, "total_tokens": 27147704} {"current_steps": 662, "total_steps": 1080, "loss": 0.0398, "lr": 1.6312969137646716e-05, "epoch": 12.036697247706423, "percentage": 61.3, "elapsed_time": "3:11:38", "remaining_time": "2:01:00", "throughput": 2365.38, "total_tokens": 27197376} {"current_steps": 663, "total_steps": 1080, "loss": 0.0373, "lr": 1.6244815468513315e-05, "epoch": 12.055045871559633, "percentage": 61.39, "elapsed_time": "3:11:57", "remaining_time": "2:00:43", "throughput": 2365.48, "total_tokens": 27244056} {"current_steps": 664, "total_steps": 1080, "loss": 0.042, "lr": 1.617673588215328e-05, "epoch": 12.073394495412844, "percentage": 61.48, "elapsed_time": "3:12:07", "remaining_time": "2:00:22", "throughput": 2365.52, "total_tokens": 27269576} {"current_steps": 665, "total_steps": 1080, "loss": 0.0317, "lr": 1.6108730954628093e-05, "epoch": 12.091743119266056, "percentage": 61.57, "elapsed_time": "3:12:28", "remaining_time": "2:00:07", "throughput": 2365.18, "total_tokens": 27314640} {"current_steps": 666, "total_steps": 1080, "loss": 0.0382, "lr": 1.6040801261367493e-05, "epoch": 12.110091743119266, "percentage": 61.67, "elapsed_time": "3:12:46", "remaining_time": "1:59:50", "throughput": 2365.28, "total_tokens": 27358840} {"current_steps": 667, "total_steps": 1080, "loss": 0.0378, "lr": 1.5972947377164645e-05, "epoch": 12.128440366972477, "percentage": 61.76, "elapsed_time": "3:13:02", "remaining_time": "1:59:31", "throughput": 2365.58, "total_tokens": 27399112} {"current_steps": 668, "total_steps": 1080, "loss": 0.0322, "lr": 1.5905169876171223e-05, "epoch": 12.146788990825687, "percentage": 61.85, "elapsed_time": "3:13:17", "remaining_time": "1:59:13", "throughput": 2365.47, "total_tokens": 27434064} {"current_steps": 669, "total_steps": 1080, "loss": 0.0421, "lr": 1.583746933189257e-05, "epoch": 12.1651376146789, "percentage": 61.94, "elapsed_time": "3:13:30", "remaining_time": "1:58:53", "throughput": 2365.8, "total_tokens": 27468528} {"current_steps": 670, "total_steps": 1080, "loss": 0.0682, "lr": 1.5769846317182893e-05, "epoch": 12.18348623853211, "percentage": 62.04, "elapsed_time": "3:13:49", "remaining_time": "1:58:36", "throughput": 2365.34, "total_tokens": 27508512} {"current_steps": 671, "total_steps": 1080, "loss": 0.0328, "lr": 1.570230140424033e-05, "epoch": 12.20183486238532, "percentage": 62.13, "elapsed_time": "3:14:08", "remaining_time": "1:58:19", "throughput": 2365.71, "total_tokens": 27555912} {"current_steps": 672, "total_steps": 1080, "loss": 0.0346, "lr": 1.56348351646022e-05, "epoch": 12.220183486238533, "percentage": 62.22, "elapsed_time": "3:14:27", "remaining_time": "1:58:03", "throughput": 2365.38, "total_tokens": 27597608} {"current_steps": 673, "total_steps": 1080, "loss": 0.037, "lr": 1.556744816914008e-05, "epoch": 12.238532110091743, "percentage": 62.31, "elapsed_time": "3:14:43", "remaining_time": "1:57:45", "throughput": 2365.22, "total_tokens": 27633496} {"current_steps": 674, "total_steps": 1080, "loss": 0.0286, "lr": 1.550014098805503e-05, "epoch": 12.256880733944953, "percentage": 62.41, "elapsed_time": "3:15:04", "remaining_time": "1:57:30", "throughput": 2364.85, "total_tokens": 27680040} {"current_steps": 675, "total_steps": 1080, "loss": 0.0308, "lr": 1.5432914190872757e-05, "epoch": 12.275229357798166, "percentage": 62.5, "elapsed_time": "3:15:22", "remaining_time": "1:57:13", "throughput": 2364.89, "total_tokens": 27721872} {"current_steps": 676, "total_steps": 1080, "loss": 0.0294, "lr": 1.5365768346438797e-05, "epoch": 12.293577981651376, "percentage": 62.59, "elapsed_time": "3:15:39", "remaining_time": "1:56:55", "throughput": 2364.93, "total_tokens": 27762968} {"current_steps": 677, "total_steps": 1080, "loss": 0.0283, "lr": 1.529870402291368e-05, "epoch": 12.311926605504587, "percentage": 62.69, "elapsed_time": "3:15:57", "remaining_time": "1:56:39", "throughput": 2365.16, "total_tokens": 27809496} {"current_steps": 678, "total_steps": 1080, "loss": 0.027, "lr": 1.523172178776816e-05, "epoch": 12.330275229357799, "percentage": 62.78, "elapsed_time": "3:16:17", "remaining_time": "1:56:23", "throughput": 2365.28, "total_tokens": 27857160} {"current_steps": 679, "total_steps": 1080, "loss": 0.0351, "lr": 1.5164822207778379e-05, "epoch": 12.34862385321101, "percentage": 62.87, "elapsed_time": "3:16:44", "remaining_time": "1:56:11", "throughput": 2365.24, "total_tokens": 27920616} {"current_steps": 680, "total_steps": 1080, "loss": 0.0749, "lr": 1.509800584902108e-05, "epoch": 12.36697247706422, "percentage": 62.96, "elapsed_time": "3:17:05", "remaining_time": "1:55:56", "throughput": 2365.44, "total_tokens": 27971920} {"current_steps": 681, "total_steps": 1080, "loss": 0.048, "lr": 1.5031273276868845e-05, "epoch": 12.385321100917432, "percentage": 63.06, "elapsed_time": "3:17:20", "remaining_time": "1:55:37", "throughput": 2365.45, "total_tokens": 28008960} {"current_steps": 682, "total_steps": 1080, "loss": 0.0319, "lr": 1.4964625055985265e-05, "epoch": 12.403669724770642, "percentage": 63.15, "elapsed_time": "3:17:41", "remaining_time": "1:55:22", "throughput": 2365.24, "total_tokens": 28055416} {"current_steps": 683, "total_steps": 1080, "loss": 0.0403, "lr": 1.4898061750320212e-05, "epoch": 12.422018348623853, "percentage": 63.24, "elapsed_time": "3:17:57", "remaining_time": "1:55:03", "throughput": 2365.3, "total_tokens": 28093136} {"current_steps": 684, "total_steps": 1080, "loss": 0.0377, "lr": 1.4831583923104999e-05, "epoch": 12.440366972477065, "percentage": 63.33, "elapsed_time": "3:18:22", "remaining_time": "1:54:50", "throughput": 2365.27, "total_tokens": 28152744} {"current_steps": 685, "total_steps": 1080, "loss": 0.0631, "lr": 1.4765192136847685e-05, "epoch": 12.458715596330276, "percentage": 63.43, "elapsed_time": "3:18:46", "remaining_time": "1:54:37", "throughput": 2364.91, "total_tokens": 28205712} {"current_steps": 686, "total_steps": 1080, "loss": 0.0304, "lr": 1.4698886953328292e-05, "epoch": 12.477064220183486, "percentage": 63.52, "elapsed_time": "3:19:02", "remaining_time": "1:54:19", "throughput": 2365.29, "total_tokens": 28248432} {"current_steps": 687, "total_steps": 1080, "loss": 0.0612, "lr": 1.463266893359403e-05, "epoch": 12.495412844036696, "percentage": 63.61, "elapsed_time": "3:19:17", "remaining_time": "1:54:00", "throughput": 2365.19, "total_tokens": 28282728} {"current_steps": 688, "total_steps": 1080, "loss": 0.0436, "lr": 1.4566538637954554e-05, "epoch": 12.513761467889909, "percentage": 63.7, "elapsed_time": "3:19:37", "remaining_time": "1:53:44", "throughput": 2365.24, "total_tokens": 28330200} {"current_steps": 689, "total_steps": 1080, "loss": 0.0339, "lr": 1.4500496625977264e-05, "epoch": 12.53211009174312, "percentage": 63.8, "elapsed_time": "3:19:53", "remaining_time": "1:53:26", "throughput": 2365.4, "total_tokens": 28368752} {"current_steps": 690, "total_steps": 1080, "loss": 0.0332, "lr": 1.443454345648252e-05, "epoch": 12.55045871559633, "percentage": 63.89, "elapsed_time": "3:20:09", "remaining_time": "1:53:07", "throughput": 2365.35, "total_tokens": 28405528} {"current_steps": 691, "total_steps": 1080, "loss": 0.0378, "lr": 1.436867968753893e-05, "epoch": 12.568807339449542, "percentage": 63.98, "elapsed_time": "3:20:28", "remaining_time": "1:52:51", "throughput": 2365.33, "total_tokens": 28451400} {"current_steps": 692, "total_steps": 1080, "loss": 0.0407, "lr": 1.430290587645865e-05, "epoch": 12.587155963302752, "percentage": 64.07, "elapsed_time": "3:20:49", "remaining_time": "1:52:36", "throughput": 2365.38, "total_tokens": 28501600} {"current_steps": 693, "total_steps": 1080, "loss": 0.0362, "lr": 1.4237222579792618e-05, "epoch": 12.605504587155963, "percentage": 64.17, "elapsed_time": "3:21:02", "remaining_time": "1:52:16", "throughput": 2365.43, "total_tokens": 28532400} {"current_steps": 694, "total_steps": 1080, "loss": 0.0423, "lr": 1.4171630353325932e-05, "epoch": 12.623853211009175, "percentage": 64.26, "elapsed_time": "3:21:18", "remaining_time": "1:51:58", "throughput": 2365.2, "total_tokens": 28568872} {"current_steps": 695, "total_steps": 1080, "loss": 0.0365, "lr": 1.4106129752073022e-05, "epoch": 12.642201834862385, "percentage": 64.35, "elapsed_time": "3:21:35", "remaining_time": "1:51:40", "throughput": 2365.36, "total_tokens": 28610976} {"current_steps": 696, "total_steps": 1080, "loss": 0.083, "lr": 1.4040721330273062e-05, "epoch": 12.660550458715596, "percentage": 64.44, "elapsed_time": "3:21:57", "remaining_time": "1:51:25", "throughput": 2364.86, "total_tokens": 28657064} {"current_steps": 697, "total_steps": 1080, "loss": 0.0285, "lr": 1.3975405641385252e-05, "epoch": 12.678899082568808, "percentage": 64.54, "elapsed_time": "3:22:16", "remaining_time": "1:51:08", "throughput": 2365.07, "total_tokens": 28702912} {"current_steps": 698, "total_steps": 1080, "loss": 0.0346, "lr": 1.3910183238084112e-05, "epoch": 12.697247706422019, "percentage": 64.63, "elapsed_time": "3:22:36", "remaining_time": "1:50:53", "throughput": 2365.28, "total_tokens": 28754368} {"current_steps": 699, "total_steps": 1080, "loss": 0.0289, "lr": 1.3845054672254781e-05, "epoch": 12.715596330275229, "percentage": 64.72, "elapsed_time": "3:22:53", "remaining_time": "1:50:35", "throughput": 2365.44, "total_tokens": 28795120} {"current_steps": 700, "total_steps": 1080, "loss": 0.0288, "lr": 1.3780020494988446e-05, "epoch": 12.73394495412844, "percentage": 64.81, "elapsed_time": "3:23:11", "remaining_time": "1:50:18", "throughput": 2365.43, "total_tokens": 28837920} {"current_steps": 701, "total_steps": 1080, "loss": 0.041, "lr": 1.3715081256577582e-05, "epoch": 12.752293577981652, "percentage": 64.91, "elapsed_time": "3:23:26", "remaining_time": "1:49:59", "throughput": 2365.47, "total_tokens": 28874200} {"current_steps": 702, "total_steps": 1080, "loss": 0.0304, "lr": 1.3650237506511331e-05, "epoch": 12.770642201834862, "percentage": 65.0, "elapsed_time": "3:23:41", "remaining_time": "1:49:40", "throughput": 2365.64, "total_tokens": 28911744} {"current_steps": 703, "total_steps": 1080, "loss": 0.0292, "lr": 1.3585489793470862e-05, "epoch": 12.788990825688073, "percentage": 65.09, "elapsed_time": "3:23:53", "remaining_time": "1:49:20", "throughput": 2365.53, "total_tokens": 28938696} {"current_steps": 704, "total_steps": 1080, "loss": 0.0321, "lr": 1.3520838665324703e-05, "epoch": 12.807339449541285, "percentage": 65.19, "elapsed_time": "3:24:11", "remaining_time": "1:49:03", "throughput": 2365.34, "total_tokens": 28978360} {"current_steps": 705, "total_steps": 1080, "loss": 0.0311, "lr": 1.3456284669124158e-05, "epoch": 12.825688073394495, "percentage": 65.28, "elapsed_time": "3:24:23", "remaining_time": "1:48:43", "throughput": 2365.39, "total_tokens": 29008048} {"current_steps": 706, "total_steps": 1080, "loss": 0.0307, "lr": 1.3391828351098578e-05, "epoch": 12.844036697247706, "percentage": 65.37, "elapsed_time": "3:24:38", "remaining_time": "1:48:24", "throughput": 2365.77, "total_tokens": 29047928} {"current_steps": 707, "total_steps": 1080, "loss": 0.033, "lr": 1.3327470256650848e-05, "epoch": 12.862385321100918, "percentage": 65.46, "elapsed_time": "3:24:51", "remaining_time": "1:48:04", "throughput": 2365.92, "total_tokens": 29080376} {"current_steps": 708, "total_steps": 1080, "loss": 0.0299, "lr": 1.3263210930352737e-05, "epoch": 12.880733944954128, "percentage": 65.56, "elapsed_time": "3:25:05", "remaining_time": "1:47:45", "throughput": 2366.01, "total_tokens": 29113856} {"current_steps": 709, "total_steps": 1080, "loss": 0.0373, "lr": 1.3199050915940225e-05, "epoch": 12.899082568807339, "percentage": 65.65, "elapsed_time": "3:25:22", "remaining_time": "1:47:28", "throughput": 2366.56, "total_tokens": 29162904} {"current_steps": 710, "total_steps": 1080, "loss": 0.0344, "lr": 1.313499075630899e-05, "epoch": 12.917431192660551, "percentage": 65.74, "elapsed_time": "3:25:35", "remaining_time": "1:47:08", "throughput": 2366.75, "total_tokens": 29195920} {"current_steps": 711, "total_steps": 1080, "loss": 0.0357, "lr": 1.3071030993509788e-05, "epoch": 12.935779816513762, "percentage": 65.83, "elapsed_time": "3:25:50", "remaining_time": "1:46:49", "throughput": 2366.78, "total_tokens": 29230376} {"current_steps": 712, "total_steps": 1080, "loss": 0.058, "lr": 1.3007172168743854e-05, "epoch": 12.954128440366972, "percentage": 65.93, "elapsed_time": "3:26:05", "remaining_time": "1:46:31", "throughput": 2366.75, "total_tokens": 29266464} {"current_steps": 713, "total_steps": 1080, "loss": 0.0332, "lr": 1.2943414822358285e-05, "epoch": 12.972477064220184, "percentage": 66.02, "elapsed_time": "3:26:22", "remaining_time": "1:46:13", "throughput": 2366.91, "total_tokens": 29308840} {"current_steps": 714, "total_steps": 1080, "loss": 0.0387, "lr": 1.2879759493841575e-05, "epoch": 12.990825688073395, "percentage": 66.11, "elapsed_time": "3:26:37", "remaining_time": "1:45:55", "throughput": 2367.08, "total_tokens": 29346656} {"current_steps": 715, "total_steps": 1080, "loss": 0.0294, "lr": 1.2816206721818944e-05, "epoch": 13.0, "percentage": 66.2, "elapsed_time": "3:26:47", "remaining_time": "1:45:34", "throughput": 2366.9, "total_tokens": 29368144} {"current_steps": 716, "total_steps": 1080, "loss": 0.029, "lr": 1.2752757044047827e-05, "epoch": 13.01834862385321, "percentage": 66.3, "elapsed_time": "3:27:04", "remaining_time": "1:45:16", "throughput": 2366.87, "total_tokens": 29406696} {"current_steps": 717, "total_steps": 1080, "loss": 0.0292, "lr": 1.2689410997413325e-05, "epoch": 13.036697247706423, "percentage": 66.39, "elapsed_time": "3:27:21", "remaining_time": "1:44:58", "throughput": 2366.92, "total_tokens": 29447448} {"current_steps": 718, "total_steps": 1080, "loss": 0.031, "lr": 1.262616911792365e-05, "epoch": 13.055045871559633, "percentage": 66.48, "elapsed_time": "3:27:39", "remaining_time": "1:44:41", "throughput": 2367.16, "total_tokens": 29493904} {"current_steps": 719, "total_steps": 1080, "loss": 0.033, "lr": 1.2563031940705594e-05, "epoch": 13.073394495412844, "percentage": 66.57, "elapsed_time": "3:27:55", "remaining_time": "1:44:23", "throughput": 2367.28, "total_tokens": 29533272} {"current_steps": 720, "total_steps": 1080, "loss": 0.0336, "lr": 1.2500000000000006e-05, "epoch": 13.091743119266056, "percentage": 66.67, "elapsed_time": "3:28:08", "remaining_time": "1:44:04", "throughput": 2367.39, "total_tokens": 29565728} {"current_steps": 721, "total_steps": 1080, "loss": 0.0237, "lr": 1.243707382915725e-05, "epoch": 13.110091743119266, "percentage": 66.76, "elapsed_time": "3:28:24", "remaining_time": "1:43:46", "throughput": 2367.44, "total_tokens": 29604480} {"current_steps": 722, "total_steps": 1080, "loss": 0.0282, "lr": 1.2374253960632757e-05, "epoch": 13.128440366972477, "percentage": 66.85, "elapsed_time": "3:28:39", "remaining_time": "1:43:27", "throughput": 2367.53, "total_tokens": 29639856} {"current_steps": 723, "total_steps": 1080, "loss": 0.0324, "lr": 1.2311540925982403e-05, "epoch": 13.146788990825687, "percentage": 66.94, "elapsed_time": "3:28:55", "remaining_time": "1:43:09", "throughput": 2367.49, "total_tokens": 29677448} {"current_steps": 724, "total_steps": 1080, "loss": 0.0269, "lr": 1.2248935255858117e-05, "epoch": 13.1651376146789, "percentage": 67.04, "elapsed_time": "3:29:14", "remaining_time": "1:42:53", "throughput": 2367.52, "total_tokens": 29723888} {"current_steps": 725, "total_steps": 1080, "loss": 0.0252, "lr": 1.2186437480003372e-05, "epoch": 13.18348623853211, "percentage": 67.13, "elapsed_time": "3:29:31", "remaining_time": "1:42:35", "throughput": 2367.89, "total_tokens": 29767992} {"current_steps": 726, "total_steps": 1080, "loss": 0.0386, "lr": 1.2124048127248644e-05, "epoch": 13.20183486238532, "percentage": 67.22, "elapsed_time": "3:29:49", "remaining_time": "1:42:18", "throughput": 2368.21, "total_tokens": 29814304} {"current_steps": 727, "total_steps": 1080, "loss": 0.0336, "lr": 1.2061767725507006e-05, "epoch": 13.220183486238533, "percentage": 67.31, "elapsed_time": "3:30:05", "remaining_time": "1:42:00", "throughput": 2368.19, "total_tokens": 29852040} {"current_steps": 728, "total_steps": 1080, "loss": 0.0262, "lr": 1.1999596801769616e-05, "epoch": 13.238532110091743, "percentage": 67.41, "elapsed_time": "3:30:20", "remaining_time": "1:41:42", "throughput": 2368.36, "total_tokens": 29889096} {"current_steps": 729, "total_steps": 1080, "loss": 0.0251, "lr": 1.1937535882101281e-05, "epoch": 13.256880733944953, "percentage": 67.5, "elapsed_time": "3:30:36", "remaining_time": "1:41:24", "throughput": 2368.44, "total_tokens": 29927888} {"current_steps": 730, "total_steps": 1080, "loss": 0.0315, "lr": 1.1875585491636e-05, "epoch": 13.275229357798166, "percentage": 67.59, "elapsed_time": "3:30:51", "remaining_time": "1:41:05", "throughput": 2368.58, "total_tokens": 29967064} {"current_steps": 731, "total_steps": 1080, "loss": 0.0259, "lr": 1.1813746154572514e-05, "epoch": 13.293577981651376, "percentage": 67.69, "elapsed_time": "3:31:14", "remaining_time": "1:40:51", "throughput": 2368.27, "total_tokens": 30016736} {"current_steps": 732, "total_steps": 1080, "loss": 0.0274, "lr": 1.175201839416988e-05, "epoch": 13.311926605504587, "percentage": 67.78, "elapsed_time": "3:31:33", "remaining_time": "1:40:34", "throughput": 2367.85, "total_tokens": 30056888} {"current_steps": 733, "total_steps": 1080, "loss": 0.0272, "lr": 1.1690402732743042e-05, "epoch": 13.330275229357799, "percentage": 67.87, "elapsed_time": "3:31:47", "remaining_time": "1:40:15", "throughput": 2367.82, "total_tokens": 30088720} {"current_steps": 734, "total_steps": 1080, "loss": 0.0443, "lr": 1.1628899691658399e-05, "epoch": 13.34862385321101, "percentage": 67.96, "elapsed_time": "3:32:05", "remaining_time": "1:39:58", "throughput": 2367.8, "total_tokens": 30131848} {"current_steps": 735, "total_steps": 1080, "loss": 0.032, "lr": 1.1567509791329401e-05, "epoch": 13.36697247706422, "percentage": 68.06, "elapsed_time": "3:32:26", "remaining_time": "1:39:43", "throughput": 2368.14, "total_tokens": 30186336} {"current_steps": 736, "total_steps": 1080, "loss": 0.0234, "lr": 1.1506233551212186e-05, "epoch": 13.385321100917432, "percentage": 68.15, "elapsed_time": "3:32:50", "remaining_time": "1:39:28", "throughput": 2368.18, "total_tokens": 30242096} {"current_steps": 737, "total_steps": 1080, "loss": 0.0242, "lr": 1.1445071489801073e-05, "epoch": 13.403669724770642, "percentage": 68.24, "elapsed_time": "3:33:02", "remaining_time": "1:39:09", "throughput": 2368.31, "total_tokens": 30273336} {"current_steps": 738, "total_steps": 1080, "loss": 0.0328, "lr": 1.1384024124624324e-05, "epoch": 13.422018348623853, "percentage": 68.33, "elapsed_time": "3:33:14", "remaining_time": "1:38:49", "throughput": 2368.24, "total_tokens": 30300544} {"current_steps": 739, "total_steps": 1080, "loss": 0.0223, "lr": 1.1323091972239635e-05, "epoch": 13.440366972477065, "percentage": 68.43, "elapsed_time": "3:33:30", "remaining_time": "1:38:31", "throughput": 2368.69, "total_tokens": 30343952} {"current_steps": 740, "total_steps": 1080, "loss": 0.0237, "lr": 1.126227554822985e-05, "epoch": 13.458715596330276, "percentage": 68.52, "elapsed_time": "3:33:50", "remaining_time": "1:38:15", "throughput": 2368.85, "total_tokens": 30393960} {"current_steps": 741, "total_steps": 1080, "loss": 0.0513, "lr": 1.1201575367198547e-05, "epoch": 13.477064220183486, "percentage": 68.61, "elapsed_time": "3:34:10", "remaining_time": "1:37:58", "throughput": 2368.88, "total_tokens": 30441256} {"current_steps": 742, "total_steps": 1080, "loss": 0.0276, "lr": 1.1140991942765713e-05, "epoch": 13.495412844036696, "percentage": 68.7, "elapsed_time": "3:34:27", "remaining_time": "1:37:41", "throughput": 2368.72, "total_tokens": 30480016} {"current_steps": 743, "total_steps": 1080, "loss": 0.0544, "lr": 1.1080525787563393e-05, "epoch": 13.513761467889909, "percentage": 68.8, "elapsed_time": "3:34:49", "remaining_time": "1:37:26", "throughput": 2368.7, "total_tokens": 30531440} {"current_steps": 744, "total_steps": 1080, "loss": 0.0252, "lr": 1.1020177413231334e-05, "epoch": 13.53211009174312, "percentage": 68.89, "elapsed_time": "3:35:07", "remaining_time": "1:37:09", "throughput": 2368.67, "total_tokens": 30572720} {"current_steps": 745, "total_steps": 1080, "loss": 0.0328, "lr": 1.0959947330412682e-05, "epoch": 13.55045871559633, "percentage": 68.98, "elapsed_time": "3:35:23", "remaining_time": "1:36:51", "throughput": 2368.55, "total_tokens": 30610416} {"current_steps": 746, "total_steps": 1080, "loss": 0.0232, "lr": 1.0899836048749645e-05, "epoch": 13.568807339449542, "percentage": 69.07, "elapsed_time": "3:35:44", "remaining_time": "1:36:35", "throughput": 2368.32, "total_tokens": 30656448} {"current_steps": 747, "total_steps": 1080, "loss": 0.0277, "lr": 1.0839844076879185e-05, "epoch": 13.587155963302752, "percentage": 69.17, "elapsed_time": "3:35:56", "remaining_time": "1:36:15", "throughput": 2368.41, "total_tokens": 30685584} {"current_steps": 748, "total_steps": 1080, "loss": 0.0289, "lr": 1.0779971922428711e-05, "epoch": 13.605504587155963, "percentage": 69.26, "elapsed_time": "3:36:14", "remaining_time": "1:35:58", "throughput": 2368.5, "total_tokens": 30729472} {"current_steps": 749, "total_steps": 1080, "loss": 0.0371, "lr": 1.0720220092011782e-05, "epoch": 13.623853211009175, "percentage": 69.35, "elapsed_time": "3:36:29", "remaining_time": "1:35:40", "throughput": 2368.57, "total_tokens": 30765400} {"current_steps": 750, "total_steps": 1080, "loss": 0.032, "lr": 1.0660589091223855e-05, "epoch": 13.642201834862385, "percentage": 69.44, "elapsed_time": "3:36:49", "remaining_time": "1:35:23", "throughput": 2368.53, "total_tokens": 30812288} {"current_steps": 751, "total_steps": 1080, "loss": 0.027, "lr": 1.0601079424637917e-05, "epoch": 13.660550458715596, "percentage": 69.54, "elapsed_time": "3:37:07", "remaining_time": "1:35:06", "throughput": 2368.56, "total_tokens": 30855592} {"current_steps": 752, "total_steps": 1080, "loss": 0.0337, "lr": 1.0541691595800337e-05, "epoch": 13.678899082568808, "percentage": 69.63, "elapsed_time": "3:37:21", "remaining_time": "1:34:48", "throughput": 2368.65, "total_tokens": 30890072} {"current_steps": 753, "total_steps": 1080, "loss": 0.0238, "lr": 1.0482426107226507e-05, "epoch": 13.697247706422019, "percentage": 69.72, "elapsed_time": "3:37:37", "remaining_time": "1:34:30", "throughput": 2368.5, "total_tokens": 30927336} {"current_steps": 754, "total_steps": 1080, "loss": 0.0294, "lr": 1.0423283460396633e-05, "epoch": 13.715596330275229, "percentage": 69.81, "elapsed_time": "3:37:52", "remaining_time": "1:34:12", "throughput": 2368.81, "total_tokens": 30966920} {"current_steps": 755, "total_steps": 1080, "loss": 0.0281, "lr": 1.0364264155751488e-05, "epoch": 13.73394495412844, "percentage": 69.91, "elapsed_time": "3:38:12", "remaining_time": "1:33:55", "throughput": 2368.92, "total_tokens": 31015544} {"current_steps": 756, "total_steps": 1080, "loss": 0.0311, "lr": 1.0305368692688174e-05, "epoch": 13.752293577981652, "percentage": 70.0, "elapsed_time": "3:38:28", "remaining_time": "1:33:38", "throughput": 2368.84, "total_tokens": 31052688} {"current_steps": 757, "total_steps": 1080, "loss": 0.0205, "lr": 1.0246597569555894e-05, "epoch": 13.770642201834862, "percentage": 70.09, "elapsed_time": "3:38:45", "remaining_time": "1:33:20", "throughput": 2368.83, "total_tokens": 31092736} {"current_steps": 758, "total_steps": 1080, "loss": 0.038, "lr": 1.0187951283651736e-05, "epoch": 13.788990825688073, "percentage": 70.19, "elapsed_time": "3:38:59", "remaining_time": "1:33:01", "throughput": 2368.72, "total_tokens": 31123536} {"current_steps": 759, "total_steps": 1080, "loss": 0.0321, "lr": 1.0129430331216471e-05, "epoch": 13.807339449541285, "percentage": 70.28, "elapsed_time": "3:39:13", "remaining_time": "1:32:42", "throughput": 2368.81, "total_tokens": 31157144} {"current_steps": 760, "total_steps": 1080, "loss": 0.0267, "lr": 1.0071035207430352e-05, "epoch": 13.825688073394495, "percentage": 70.37, "elapsed_time": "3:39:40", "remaining_time": "1:32:29", "throughput": 2368.82, "total_tokens": 31222320} {"current_steps": 761, "total_steps": 1080, "loss": 0.0261, "lr": 1.001276640640891e-05, "epoch": 13.844036697247706, "percentage": 70.46, "elapsed_time": "3:40:06", "remaining_time": "1:32:15", "throughput": 2368.44, "total_tokens": 31277880} {"current_steps": 762, "total_steps": 1080, "loss": 0.0639, "lr": 9.954624421198792e-06, "epoch": 13.862385321100918, "percentage": 70.56, "elapsed_time": "3:40:33", "remaining_time": "1:32:02", "throughput": 2368.2, "total_tokens": 31338856} {"current_steps": 763, "total_steps": 1080, "loss": 0.0338, "lr": 9.89660974377359e-06, "epoch": 13.880733944954128, "percentage": 70.65, "elapsed_time": "3:40:48", "remaining_time": "1:31:44", "throughput": 2368.25, "total_tokens": 31376304} {"current_steps": 764, "total_steps": 1080, "loss": 0.0371, "lr": 9.838722865029673e-06, "epoch": 13.899082568807339, "percentage": 70.74, "elapsed_time": "3:41:02", "remaining_time": "1:31:25", "throughput": 2368.46, "total_tokens": 31410672} {"current_steps": 765, "total_steps": 1080, "loss": 0.0241, "lr": 9.780964274781984e-06, "epoch": 13.917431192660551, "percentage": 70.83, "elapsed_time": "3:41:16", "remaining_time": "1:31:06", "throughput": 2368.51, "total_tokens": 31444928} {"current_steps": 766, "total_steps": 1080, "loss": 0.0357, "lr": 9.723334461760006e-06, "epoch": 13.935779816513762, "percentage": 70.93, "elapsed_time": "3:41:31", "remaining_time": "1:30:48", "throughput": 2368.56, "total_tokens": 31482232} {"current_steps": 767, "total_steps": 1080, "loss": 0.0312, "lr": 9.665833913603523e-06, "epoch": 13.954128440366972, "percentage": 71.02, "elapsed_time": "3:41:45", "remaining_time": "1:30:29", "throughput": 2368.49, "total_tokens": 31513856} {"current_steps": 768, "total_steps": 1080, "loss": 0.0584, "lr": 9.608463116858542e-06, "epoch": 13.972477064220184, "percentage": 71.11, "elapsed_time": "3:42:08", "remaining_time": "1:30:14", "throughput": 2368.14, "total_tokens": 31563800} {"current_steps": 769, "total_steps": 1080, "loss": 0.0356, "lr": 9.551222556973172e-06, "epoch": 13.990825688073395, "percentage": 71.2, "elapsed_time": "3:42:27", "remaining_time": "1:29:58", "throughput": 2367.96, "total_tokens": 31606368} {"current_steps": 770, "total_steps": 1080, "loss": 0.0511, "lr": 9.494112718293501e-06, "epoch": 14.0, "percentage": 71.3, "elapsed_time": "3:42:36", "remaining_time": "1:29:37", "throughput": 2367.85, "total_tokens": 31627232} {"current_steps": 771, "total_steps": 1080, "loss": 0.0237, "lr": 9.437134084059515e-06, "epoch": 14.01834862385321, "percentage": 71.39, "elapsed_time": "3:42:54", "remaining_time": "1:29:20", "throughput": 2367.81, "total_tokens": 31669296} {"current_steps": 772, "total_steps": 1080, "loss": 0.026, "lr": 9.380287136401e-06, "epoch": 14.036697247706423, "percentage": 71.48, "elapsed_time": "3:43:09", "remaining_time": "1:29:01", "throughput": 2367.84, "total_tokens": 31704400} {"current_steps": 773, "total_steps": 1080, "loss": 0.0252, "lr": 9.323572356333454e-06, "epoch": 14.055045871559633, "percentage": 71.57, "elapsed_time": "3:43:23", "remaining_time": "1:28:43", "throughput": 2368.03, "total_tokens": 31739048} {"current_steps": 774, "total_steps": 1080, "loss": 0.0175, "lr": 9.266990223754069e-06, "epoch": 14.073394495412844, "percentage": 71.67, "elapsed_time": "3:43:36", "remaining_time": "1:28:24", "throughput": 2368.38, "total_tokens": 31776056} {"current_steps": 775, "total_steps": 1080, "loss": 0.0269, "lr": 9.210541217437565e-06, "epoch": 14.091743119266056, "percentage": 71.76, "elapsed_time": "3:43:51", "remaining_time": "1:28:05", "throughput": 2368.68, "total_tokens": 31814504} {"current_steps": 776, "total_steps": 1080, "loss": 0.0283, "lr": 9.154225815032242e-06, "epoch": 14.110091743119266, "percentage": 71.85, "elapsed_time": "3:44:04", "remaining_time": "1:27:46", "throughput": 2368.76, "total_tokens": 31846928} {"current_steps": 777, "total_steps": 1080, "loss": 0.0256, "lr": 9.098044493055899e-06, "epoch": 14.128440366972477, "percentage": 71.94, "elapsed_time": "3:44:24", "remaining_time": "1:27:30", "throughput": 2368.63, "total_tokens": 31893152} {"current_steps": 778, "total_steps": 1080, "loss": 0.0202, "lr": 9.0419977268918e-06, "epoch": 14.146788990825687, "percentage": 72.04, "elapsed_time": "3:44:41", "remaining_time": "1:27:13", "throughput": 2368.93, "total_tokens": 31937456} {"current_steps": 779, "total_steps": 1080, "loss": 0.0301, "lr": 8.98608599078462e-06, "epoch": 14.1651376146789, "percentage": 72.13, "elapsed_time": "3:44:56", "remaining_time": "1:26:54", "throughput": 2368.75, "total_tokens": 31969928} {"current_steps": 780, "total_steps": 1080, "loss": 0.0256, "lr": 8.930309757836517e-06, "epoch": 14.18348623853211, "percentage": 72.22, "elapsed_time": "3:45:27", "remaining_time": "1:26:43", "throughput": 2367.92, "total_tokens": 32032920} {"current_steps": 781, "total_steps": 1080, "loss": 0.0247, "lr": 8.874669500003049e-06, "epoch": 14.20183486238532, "percentage": 72.31, "elapsed_time": "3:45:49", "remaining_time": "1:26:27", "throughput": 2368.27, "total_tokens": 32087928} {"current_steps": 782, "total_steps": 1080, "loss": 0.026, "lr": 8.819165688089193e-06, "epoch": 14.220183486238533, "percentage": 72.41, "elapsed_time": "3:46:09", "remaining_time": "1:26:10", "throughput": 2368.15, "total_tokens": 32133632} {"current_steps": 783, "total_steps": 1080, "loss": 0.0307, "lr": 8.763798791745411e-06, "epoch": 14.238532110091743, "percentage": 72.5, "elapsed_time": "3:46:29", "remaining_time": "1:25:54", "throughput": 2367.88, "total_tokens": 32178024} {"current_steps": 784, "total_steps": 1080, "loss": 0.028, "lr": 8.708569279463622e-06, "epoch": 14.256880733944953, "percentage": 72.59, "elapsed_time": "3:46:52", "remaining_time": "1:25:39", "throughput": 2367.7, "total_tokens": 32229216} {"current_steps": 785, "total_steps": 1080, "loss": 0.047, "lr": 8.65347761857326e-06, "epoch": 14.275229357798166, "percentage": 72.69, "elapsed_time": "3:47:13", "remaining_time": "1:25:23", "throughput": 2367.67, "total_tokens": 32279544} {"current_steps": 786, "total_steps": 1080, "loss": 0.0221, "lr": 8.598524275237322e-06, "epoch": 14.293577981651376, "percentage": 72.78, "elapsed_time": "3:47:28", "remaining_time": "1:25:05", "throughput": 2367.63, "total_tokens": 32314736} {"current_steps": 787, "total_steps": 1080, "loss": 0.0211, "lr": 8.543709714448403e-06, "epoch": 14.311926605504587, "percentage": 72.87, "elapsed_time": "3:47:47", "remaining_time": "1:24:48", "throughput": 2367.46, "total_tokens": 32357232} {"current_steps": 788, "total_steps": 1080, "loss": 0.0304, "lr": 8.489034400024812e-06, "epoch": 14.330275229357799, "percentage": 72.96, "elapsed_time": "3:48:02", "remaining_time": "1:24:30", "throughput": 2367.49, "total_tokens": 32392992} {"current_steps": 789, "total_steps": 1080, "loss": 0.0225, "lr": 8.434498794606568e-06, "epoch": 14.34862385321101, "percentage": 73.06, "elapsed_time": "3:48:20", "remaining_time": "1:24:13", "throughput": 2367.41, "total_tokens": 32434840} {"current_steps": 790, "total_steps": 1080, "loss": 0.0195, "lr": 8.380103359651553e-06, "epoch": 14.36697247706422, "percentage": 73.15, "elapsed_time": "3:48:39", "remaining_time": "1:23:56", "throughput": 2367.46, "total_tokens": 32480592} {"current_steps": 791, "total_steps": 1080, "loss": 0.0258, "lr": 8.325848555431595e-06, "epoch": 14.385321100917432, "percentage": 73.24, "elapsed_time": "3:48:53", "remaining_time": "1:23:37", "throughput": 2367.45, "total_tokens": 32514440} {"current_steps": 792, "total_steps": 1080, "loss": 0.045, "lr": 8.271734841028553e-06, "epoch": 14.403669724770642, "percentage": 73.33, "elapsed_time": "3:49:11", "remaining_time": "1:23:20", "throughput": 2367.46, "total_tokens": 32557176} {"current_steps": 793, "total_steps": 1080, "loss": 0.0304, "lr": 8.217762674330413e-06, "epoch": 14.422018348623853, "percentage": 73.43, "elapsed_time": "3:49:28", "remaining_time": "1:23:02", "throughput": 2367.36, "total_tokens": 32594416} {"current_steps": 794, "total_steps": 1080, "loss": 0.0178, "lr": 8.163932512027492e-06, "epoch": 14.440366972477065, "percentage": 73.52, "elapsed_time": "3:49:46", "remaining_time": "1:22:45", "throughput": 2367.41, "total_tokens": 32638344} {"current_steps": 795, "total_steps": 1080, "loss": 0.0336, "lr": 8.110244809608495e-06, "epoch": 14.458715596330276, "percentage": 73.61, "elapsed_time": "3:50:00", "remaining_time": "1:22:27", "throughput": 2367.62, "total_tokens": 32674416} {"current_steps": 796, "total_steps": 1080, "loss": 0.0309, "lr": 8.056700021356694e-06, "epoch": 14.477064220183486, "percentage": 73.7, "elapsed_time": "3:50:23", "remaining_time": "1:22:12", "throughput": 2367.36, "total_tokens": 32725808} {"current_steps": 797, "total_steps": 1080, "loss": 0.0247, "lr": 8.003298600346085e-06, "epoch": 14.495412844036696, "percentage": 73.8, "elapsed_time": "3:50:38", "remaining_time": "1:21:53", "throughput": 2367.44, "total_tokens": 32761224} {"current_steps": 798, "total_steps": 1080, "loss": 0.0235, "lr": 7.950040998437542e-06, "epoch": 14.513761467889909, "percentage": 73.89, "elapsed_time": "3:51:00", "remaining_time": "1:21:38", "throughput": 2367.34, "total_tokens": 32812208} {"current_steps": 799, "total_steps": 1080, "loss": 0.0195, "lr": 7.896927666275006e-06, "epoch": 14.53211009174312, "percentage": 73.98, "elapsed_time": "3:51:18", "remaining_time": "1:21:21", "throughput": 2367.52, "total_tokens": 32858672} {"current_steps": 800, "total_steps": 1080, "loss": 0.0397, "lr": 7.843959053281663e-06, "epoch": 14.55045871559633, "percentage": 74.07, "elapsed_time": "3:51:41", "remaining_time": "1:21:05", "throughput": 2367.06, "total_tokens": 32905792} {"current_steps": 801, "total_steps": 1080, "loss": 0.0216, "lr": 7.791135607656147e-06, "epoch": 14.568807339449542, "percentage": 74.17, "elapsed_time": "3:51:58", "remaining_time": "1:20:48", "throughput": 2367.1, "total_tokens": 32946456} {"current_steps": 802, "total_steps": 1080, "loss": 0.0201, "lr": 7.738457776368766e-06, "epoch": 14.587155963302752, "percentage": 74.26, "elapsed_time": "3:52:13", "remaining_time": "1:20:29", "throughput": 2367.32, "total_tokens": 32985008} {"current_steps": 803, "total_steps": 1080, "loss": 0.0229, "lr": 7.685926005157651e-06, "epoch": 14.605504587155963, "percentage": 74.35, "elapsed_time": "3:52:32", "remaining_time": "1:20:13", "throughput": 2367.27, "total_tokens": 33029600} {"current_steps": 804, "total_steps": 1080, "loss": 0.0268, "lr": 7.633540738525066e-06, "epoch": 14.623853211009175, "percentage": 74.44, "elapsed_time": "3:52:47", "remaining_time": "1:19:54", "throughput": 2367.25, "total_tokens": 33064056} {"current_steps": 805, "total_steps": 1080, "loss": 0.0241, "lr": 7.581302419733632e-06, "epoch": 14.642201834862385, "percentage": 74.54, "elapsed_time": "3:53:01", "remaining_time": "1:19:36", "throughput": 2367.42, "total_tokens": 33099880} {"current_steps": 806, "total_steps": 1080, "loss": 0.0244, "lr": 7.529211490802498e-06, "epoch": 14.660550458715596, "percentage": 74.63, "elapsed_time": "3:53:15", "remaining_time": "1:19:17", "throughput": 2367.48, "total_tokens": 33134376} {"current_steps": 807, "total_steps": 1080, "loss": 0.0225, "lr": 7.477268392503728e-06, "epoch": 14.678899082568808, "percentage": 74.72, "elapsed_time": "3:53:31", "remaining_time": "1:18:59", "throughput": 2367.57, "total_tokens": 33172056} {"current_steps": 808, "total_steps": 1080, "loss": 0.0241, "lr": 7.4254735643584564e-06, "epoch": 14.697247706422019, "percentage": 74.81, "elapsed_time": "3:53:56", "remaining_time": "1:18:45", "throughput": 2367.06, "total_tokens": 33224448} {"current_steps": 809, "total_steps": 1080, "loss": 0.0228, "lr": 7.3738274446332415e-06, "epoch": 14.715596330275229, "percentage": 74.91, "elapsed_time": "3:54:13", "remaining_time": "1:18:27", "throughput": 2367.03, "total_tokens": 33264800} {"current_steps": 810, "total_steps": 1080, "loss": 0.025, "lr": 7.3223304703363135e-06, "epoch": 14.73394495412844, "percentage": 75.0, "elapsed_time": "3:54:28", "remaining_time": "1:18:09", "throughput": 2367.01, "total_tokens": 33300896} {"current_steps": 811, "total_steps": 1080, "loss": 0.0243, "lr": 7.270983077213911e-06, "epoch": 14.752293577981652, "percentage": 75.09, "elapsed_time": "3:54:43", "remaining_time": "1:17:51", "throughput": 2367.0, "total_tokens": 33335304} {"current_steps": 812, "total_steps": 1080, "loss": 0.0186, "lr": 7.219785699746573e-06, "epoch": 14.770642201834862, "percentage": 75.19, "elapsed_time": "3:55:02", "remaining_time": "1:17:34", "throughput": 2367.24, "total_tokens": 33382912} {"current_steps": 813, "total_steps": 1080, "loss": 0.0299, "lr": 7.168738771145464e-06, "epoch": 14.788990825688073, "percentage": 75.28, "elapsed_time": "3:55:19", "remaining_time": "1:17:16", "throughput": 2367.2, "total_tokens": 33422688} {"current_steps": 814, "total_steps": 1080, "loss": 0.0301, "lr": 7.117842723348717e-06, "epoch": 14.807339449541285, "percentage": 75.37, "elapsed_time": "3:55:33", "remaining_time": "1:16:58", "throughput": 2367.26, "total_tokens": 33456520} {"current_steps": 815, "total_steps": 1080, "loss": 0.0285, "lr": 7.067097987017762e-06, "epoch": 14.825688073394495, "percentage": 75.46, "elapsed_time": "3:55:51", "remaining_time": "1:16:41", "throughput": 2367.32, "total_tokens": 33501112} {"current_steps": 816, "total_steps": 1080, "loss": 0.0314, "lr": 7.016504991533726e-06, "epoch": 14.844036697247706, "percentage": 75.56, "elapsed_time": "3:56:06", "remaining_time": "1:16:23", "throughput": 2367.29, "total_tokens": 33535160} {"current_steps": 817, "total_steps": 1080, "loss": 0.0289, "lr": 6.9660641649937155e-06, "epoch": 14.862385321100918, "percentage": 75.65, "elapsed_time": "3:56:27", "remaining_time": "1:16:07", "throughput": 2367.15, "total_tokens": 33583896} {"current_steps": 818, "total_steps": 1080, "loss": 0.0225, "lr": 6.9157759342072995e-06, "epoch": 14.880733944954128, "percentage": 75.74, "elapsed_time": "3:56:40", "remaining_time": "1:15:48", "throughput": 2367.33, "total_tokens": 33616680} {"current_steps": 819, "total_steps": 1080, "loss": 0.029, "lr": 6.865640724692815e-06, "epoch": 14.899082568807339, "percentage": 75.83, "elapsed_time": "3:56:55", "remaining_time": "1:15:30", "throughput": 2367.26, "total_tokens": 33652496} {"current_steps": 820, "total_steps": 1080, "loss": 0.0379, "lr": 6.815658960673782e-06, "epoch": 14.917431192660551, "percentage": 75.93, "elapsed_time": "3:57:15", "remaining_time": "1:15:13", "throughput": 2366.99, "total_tokens": 33695760} {"current_steps": 821, "total_steps": 1080, "loss": 0.0224, "lr": 6.765831065075367e-06, "epoch": 14.935779816513762, "percentage": 76.02, "elapsed_time": "3:57:31", "remaining_time": "1:14:55", "throughput": 2367.09, "total_tokens": 33734472} {"current_steps": 822, "total_steps": 1080, "loss": 0.0243, "lr": 6.716157459520739e-06, "epoch": 14.954128440366972, "percentage": 76.11, "elapsed_time": "3:57:56", "remaining_time": "1:14:41", "throughput": 2366.93, "total_tokens": 33792456} {"current_steps": 823, "total_steps": 1080, "loss": 0.0203, "lr": 6.666638564327532e-06, "epoch": 14.972477064220184, "percentage": 76.2, "elapsed_time": "3:58:14", "remaining_time": "1:14:23", "throughput": 2367.17, "total_tokens": 33837616} {"current_steps": 824, "total_steps": 1080, "loss": 0.0316, "lr": 6.617274798504286e-06, "epoch": 14.990825688073395, "percentage": 76.3, "elapsed_time": "3:58:27", "remaining_time": "1:14:04", "throughput": 2367.45, "total_tokens": 33871912} {"current_steps": 825, "total_steps": 1080, "loss": 0.038, "lr": 6.568066579746901e-06, "epoch": 15.0, "percentage": 76.39, "elapsed_time": "3:58:33", "remaining_time": "1:13:44", "throughput": 2367.39, "total_tokens": 33886320} {"current_steps": 826, "total_steps": 1080, "loss": 0.0212, "lr": 6.519014324435102e-06, "epoch": 15.01834862385321, "percentage": 76.48, "elapsed_time": "3:58:51", "remaining_time": "1:13:26", "throughput": 2367.51, "total_tokens": 33929160} {"current_steps": 827, "total_steps": 1080, "loss": 0.0303, "lr": 6.470118447628912e-06, "epoch": 15.036697247706423, "percentage": 76.57, "elapsed_time": "3:59:11", "remaining_time": "1:13:10", "throughput": 2367.46, "total_tokens": 33976056} {"current_steps": 828, "total_steps": 1080, "loss": 0.0394, "lr": 6.421379363065142e-06, "epoch": 15.055045871559633, "percentage": 76.67, "elapsed_time": "3:59:28", "remaining_time": "1:12:53", "throughput": 2367.45, "total_tokens": 34016992} {"current_steps": 829, "total_steps": 1080, "loss": 0.0238, "lr": 6.3727974831539115e-06, "epoch": 15.073394495412844, "percentage": 76.76, "elapsed_time": "3:59:45", "remaining_time": "1:12:35", "throughput": 2367.29, "total_tokens": 34054944} {"current_steps": 830, "total_steps": 1080, "loss": 0.0382, "lr": 6.324373218975105e-06, "epoch": 15.091743119266056, "percentage": 76.85, "elapsed_time": "4:00:04", "remaining_time": "1:12:18", "throughput": 2367.38, "total_tokens": 34100400} {"current_steps": 831, "total_steps": 1080, "loss": 0.0195, "lr": 6.2761069802749455e-06, "epoch": 15.110091743119266, "percentage": 76.94, "elapsed_time": "4:00:26", "remaining_time": "1:12:02", "throughput": 2367.47, "total_tokens": 34154080} {"current_steps": 832, "total_steps": 1080, "loss": 0.0192, "lr": 6.22799917546252e-06, "epoch": 15.128440366972477, "percentage": 77.04, "elapsed_time": "4:00:51", "remaining_time": "1:11:47", "throughput": 2367.3, "total_tokens": 34211416} {"current_steps": 833, "total_steps": 1080, "loss": 0.0225, "lr": 6.180050211606303e-06, "epoch": 15.146788990825687, "percentage": 77.13, "elapsed_time": "4:01:08", "remaining_time": "1:11:30", "throughput": 2367.25, "total_tokens": 34250208} {"current_steps": 834, "total_steps": 1080, "loss": 0.0188, "lr": 6.1322604944307e-06, "epoch": 15.1651376146789, "percentage": 77.22, "elapsed_time": "4:01:32", "remaining_time": "1:11:14", "throughput": 2367.19, "total_tokens": 34305792} {"current_steps": 835, "total_steps": 1080, "loss": 0.0205, "lr": 6.08463042831268e-06, "epoch": 15.18348623853211, "percentage": 77.31, "elapsed_time": "4:01:48", "remaining_time": "1:10:57", "throughput": 2367.2, "total_tokens": 34345272} {"current_steps": 836, "total_steps": 1080, "loss": 0.0241, "lr": 6.037160416278278e-06, "epoch": 15.20183486238532, "percentage": 77.41, "elapsed_time": "4:02:03", "remaining_time": "1:10:38", "throughput": 2367.34, "total_tokens": 34381752} {"current_steps": 837, "total_steps": 1080, "loss": 0.0203, "lr": 5.989850859999227e-06, "epoch": 15.220183486238533, "percentage": 77.5, "elapsed_time": "4:02:20", "remaining_time": "1:10:21", "throughput": 2367.43, "total_tokens": 34423552} {"current_steps": 838, "total_steps": 1080, "loss": 0.0204, "lr": 5.942702159789554e-06, "epoch": 15.238532110091743, "percentage": 77.59, "elapsed_time": "4:02:36", "remaining_time": "1:10:03", "throughput": 2367.63, "total_tokens": 34463296} {"current_steps": 839, "total_steps": 1080, "loss": 0.0262, "lr": 5.895714714602171e-06, "epoch": 15.256880733944953, "percentage": 77.69, "elapsed_time": "4:02:49", "remaining_time": "1:09:44", "throughput": 2367.62, "total_tokens": 34494592} {"current_steps": 840, "total_steps": 1080, "loss": 0.0232, "lr": 5.848888922025553e-06, "epoch": 15.275229357798166, "percentage": 77.78, "elapsed_time": "4:03:06", "remaining_time": "1:09:27", "throughput": 2367.63, "total_tokens": 34536560} {"current_steps": 841, "total_steps": 1080, "loss": 0.0244, "lr": 5.802225178280288e-06, "epoch": 15.293577981651376, "percentage": 77.87, "elapsed_time": "4:03:18", "remaining_time": "1:09:08", "throughput": 2367.72, "total_tokens": 34565424} {"current_steps": 842, "total_steps": 1080, "loss": 0.0178, "lr": 5.755723878215802e-06, "epoch": 15.311926605504587, "percentage": 77.96, "elapsed_time": "4:03:38", "remaining_time": "1:08:52", "throughput": 2367.87, "total_tokens": 34615248} {"current_steps": 843, "total_steps": 1080, "loss": 0.0237, "lr": 5.709385415307006e-06, "epoch": 15.330275229357799, "percentage": 78.06, "elapsed_time": "4:03:51", "remaining_time": "1:08:33", "throughput": 2367.81, "total_tokens": 34643648} {"current_steps": 844, "total_steps": 1080, "loss": 0.0189, "lr": 5.663210181650905e-06, "epoch": 15.34862385321101, "percentage": 78.15, "elapsed_time": "4:04:08", "remaining_time": "1:08:15", "throughput": 2367.46, "total_tokens": 34678888} {"current_steps": 845, "total_steps": 1080, "loss": 0.0228, "lr": 5.617198567963352e-06, "epoch": 15.36697247706422, "percentage": 78.24, "elapsed_time": "4:04:24", "remaining_time": "1:07:58", "throughput": 2367.38, "total_tokens": 34717536} {"current_steps": 846, "total_steps": 1080, "loss": 0.0187, "lr": 5.571350963575728e-06, "epoch": 15.385321100917432, "percentage": 78.33, "elapsed_time": "4:04:40", "remaining_time": "1:07:40", "throughput": 2367.41, "total_tokens": 34755840} {"current_steps": 847, "total_steps": 1080, "loss": 0.0277, "lr": 5.525667756431616e-06, "epoch": 15.403669724770642, "percentage": 78.43, "elapsed_time": "4:04:55", "remaining_time": "1:07:22", "throughput": 2367.35, "total_tokens": 34788648} {"current_steps": 848, "total_steps": 1080, "loss": 0.0261, "lr": 5.48014933308352e-06, "epoch": 15.422018348623853, "percentage": 78.52, "elapsed_time": "4:05:07", "remaining_time": "1:07:03", "throughput": 2367.38, "total_tokens": 34818368} {"current_steps": 849, "total_steps": 1080, "loss": 0.0243, "lr": 5.434796078689652e-06, "epoch": 15.440366972477065, "percentage": 78.61, "elapsed_time": "4:05:33", "remaining_time": "1:06:48", "throughput": 2367.32, "total_tokens": 34877832} {"current_steps": 850, "total_steps": 1080, "loss": 0.0195, "lr": 5.389608377010608e-06, "epoch": 15.458715596330276, "percentage": 78.7, "elapsed_time": "4:05:54", "remaining_time": "1:06:32", "throughput": 2367.43, "total_tokens": 34929560} {"current_steps": 851, "total_steps": 1080, "loss": 0.0198, "lr": 5.344586610406146e-06, "epoch": 15.477064220183486, "percentage": 78.8, "elapsed_time": "4:06:10", "remaining_time": "1:06:14", "throughput": 2367.55, "total_tokens": 34969976} {"current_steps": 852, "total_steps": 1080, "loss": 0.0169, "lr": 5.299731159831953e-06, "epoch": 15.495412844036696, "percentage": 78.89, "elapsed_time": "4:06:26", "remaining_time": "1:05:56", "throughput": 2367.66, "total_tokens": 35008288} {"current_steps": 853, "total_steps": 1080, "loss": 0.0314, "lr": 5.2550424048364185e-06, "epoch": 15.513761467889909, "percentage": 78.98, "elapsed_time": "4:06:41", "remaining_time": "1:05:38", "throughput": 2367.72, "total_tokens": 35045016} {"current_steps": 854, "total_steps": 1080, "loss": 0.0192, "lr": 5.210520723557419e-06, "epoch": 15.53211009174312, "percentage": 79.07, "elapsed_time": "4:06:59", "remaining_time": "1:05:21", "throughput": 2367.57, "total_tokens": 35085312} {"current_steps": 855, "total_steps": 1080, "loss": 0.0243, "lr": 5.166166492719124e-06, "epoch": 15.55045871559633, "percentage": 79.17, "elapsed_time": "4:07:17", "remaining_time": "1:05:04", "throughput": 2367.68, "total_tokens": 35130040} {"current_steps": 856, "total_steps": 1080, "loss": 0.026, "lr": 5.121980087628803e-06, "epoch": 15.568807339449542, "percentage": 79.26, "elapsed_time": "4:07:34", "remaining_time": "1:04:47", "throughput": 2367.66, "total_tokens": 35169456} {"current_steps": 857, "total_steps": 1080, "loss": 0.0177, "lr": 5.077961882173676e-06, "epoch": 15.587155963302752, "percentage": 79.35, "elapsed_time": "4:07:52", "remaining_time": "1:04:30", "throughput": 2367.84, "total_tokens": 35216632} {"current_steps": 858, "total_steps": 1080, "loss": 0.0175, "lr": 5.034112248817685e-06, "epoch": 15.605504587155963, "percentage": 79.44, "elapsed_time": "4:08:12", "remaining_time": "1:04:13", "throughput": 2367.82, "total_tokens": 35263048} {"current_steps": 859, "total_steps": 1080, "loss": 0.0182, "lr": 4.990431558598408e-06, "epoch": 15.623853211009175, "percentage": 79.54, "elapsed_time": "4:08:29", "remaining_time": "1:03:55", "throughput": 2368.12, "total_tokens": 35306376} {"current_steps": 860, "total_steps": 1080, "loss": 0.0236, "lr": 4.946920181123904e-06, "epoch": 15.642201834862385, "percentage": 79.63, "elapsed_time": "4:08:44", "remaining_time": "1:03:37", "throughput": 2368.0, "total_tokens": 35341168} {"current_steps": 861, "total_steps": 1080, "loss": 0.0178, "lr": 4.903578484569568e-06, "epoch": 15.660550458715596, "percentage": 79.72, "elapsed_time": "4:09:00", "remaining_time": "1:03:20", "throughput": 2367.86, "total_tokens": 35376920} {"current_steps": 862, "total_steps": 1080, "loss": 0.0257, "lr": 4.860406835675016e-06, "epoch": 15.678899082568808, "percentage": 79.81, "elapsed_time": "4:09:20", "remaining_time": "1:03:03", "throughput": 2368.24, "total_tokens": 35430304} {"current_steps": 863, "total_steps": 1080, "loss": 0.0218, "lr": 4.817405599741004e-06, "epoch": 15.697247706422019, "percentage": 79.91, "elapsed_time": "4:09:36", "remaining_time": "1:02:45", "throughput": 2368.12, "total_tokens": 35466728} {"current_steps": 864, "total_steps": 1080, "loss": 0.0231, "lr": 4.7745751406263165e-06, "epoch": 15.715596330275229, "percentage": 80.0, "elapsed_time": "4:09:51", "remaining_time": "1:02:27", "throughput": 2368.21, "total_tokens": 35503792} {"current_steps": 865, "total_steps": 1080, "loss": 0.0372, "lr": 4.731915820744695e-06, "epoch": 15.73394495412844, "percentage": 80.09, "elapsed_time": "4:10:13", "remaining_time": "1:02:11", "throughput": 2367.61, "total_tokens": 35545312} {"current_steps": 866, "total_steps": 1080, "loss": 0.0281, "lr": 4.689428001061774e-06, "epoch": 15.752293577981652, "percentage": 80.19, "elapsed_time": "4:10:26", "remaining_time": "1:01:53", "throughput": 2367.51, "total_tokens": 35576480} {"current_steps": 867, "total_steps": 1080, "loss": 0.0214, "lr": 4.647112041092022e-06, "epoch": 15.770642201834862, "percentage": 80.28, "elapsed_time": "4:10:41", "remaining_time": "1:01:35", "throughput": 2367.61, "total_tokens": 35613240} {"current_steps": 868, "total_steps": 1080, "loss": 0.0296, "lr": 4.604968298895703e-06, "epoch": 15.788990825688073, "percentage": 80.37, "elapsed_time": "4:11:06", "remaining_time": "1:01:19", "throughput": 2367.55, "total_tokens": 35671328} {"current_steps": 869, "total_steps": 1080, "loss": 0.0256, "lr": 4.562997131075841e-06, "epoch": 15.807339449541285, "percentage": 80.46, "elapsed_time": "4:11:18", "remaining_time": "1:01:01", "throughput": 2367.61, "total_tokens": 35701032} {"current_steps": 870, "total_steps": 1080, "loss": 0.0247, "lr": 4.521198892775203e-06, "epoch": 15.825688073394495, "percentage": 80.56, "elapsed_time": "4:11:46", "remaining_time": "1:00:46", "throughput": 2367.16, "total_tokens": 35759112} {"current_steps": 871, "total_steps": 1080, "loss": 0.0222, "lr": 4.479573937673326e-06, "epoch": 15.844036697247706, "percentage": 80.65, "elapsed_time": "4:12:01", "remaining_time": "1:00:28", "throughput": 2367.19, "total_tokens": 35794232} {"current_steps": 872, "total_steps": 1080, "loss": 0.0266, "lr": 4.438122617983443e-06, "epoch": 15.862385321100918, "percentage": 80.74, "elapsed_time": "4:12:14", "remaining_time": "1:00:09", "throughput": 2367.21, "total_tokens": 35825360} {"current_steps": 873, "total_steps": 1080, "loss": 0.0238, "lr": 4.396845284449608e-06, "epoch": 15.880733944954128, "percentage": 80.83, "elapsed_time": "4:12:29", "remaining_time": "0:59:52", "throughput": 2367.15, "total_tokens": 35860784} {"current_steps": 874, "total_steps": 1080, "loss": 0.0243, "lr": 4.355742286343648e-06, "epoch": 15.899082568807339, "percentage": 80.93, "elapsed_time": "4:12:53", "remaining_time": "0:59:36", "throughput": 2367.02, "total_tokens": 35915640} {"current_steps": 875, "total_steps": 1080, "loss": 0.019, "lr": 4.314813971462237e-06, "epoch": 15.917431192660551, "percentage": 81.02, "elapsed_time": "4:13:13", "remaining_time": "0:59:19", "throughput": 2367.52, "total_tokens": 35970056} {"current_steps": 876, "total_steps": 1080, "loss": 0.0224, "lr": 4.274060686123959e-06, "epoch": 15.935779816513762, "percentage": 81.11, "elapsed_time": "4:13:26", "remaining_time": "0:59:01", "throughput": 2367.69, "total_tokens": 36004072} {"current_steps": 877, "total_steps": 1080, "loss": 0.0199, "lr": 4.233482775166364e-06, "epoch": 15.954128440366972, "percentage": 81.2, "elapsed_time": "4:13:50", "remaining_time": "0:58:45", "throughput": 2367.38, "total_tokens": 36056968} {"current_steps": 878, "total_steps": 1080, "loss": 0.0256, "lr": 4.19308058194306e-06, "epoch": 15.972477064220184, "percentage": 81.3, "elapsed_time": "4:14:04", "remaining_time": "0:58:27", "throughput": 2367.5, "total_tokens": 36091736} {"current_steps": 879, "total_steps": 1080, "loss": 0.0245, "lr": 4.152854448320797e-06, "epoch": 15.990825688073395, "percentage": 81.39, "elapsed_time": "4:14:21", "remaining_time": "0:58:09", "throughput": 2367.4, "total_tokens": 36129176} {"current_steps": 880, "total_steps": 1080, "loss": 0.028, "lr": 4.112804714676594e-06, "epoch": 16.0, "percentage": 81.48, "elapsed_time": "4:14:28", "remaining_time": "0:57:50", "throughput": 2367.38, "total_tokens": 36145408} {"current_steps": 881, "total_steps": 1080, "loss": 0.0203, "lr": 4.072931719894829e-06, "epoch": 16.01834862385321, "percentage": 81.57, "elapsed_time": "4:14:46", "remaining_time": "0:57:32", "throughput": 2367.24, "total_tokens": 36186960} {"current_steps": 882, "total_steps": 1080, "loss": 0.0187, "lr": 4.0332358013644016e-06, "epoch": 16.03669724770642, "percentage": 81.67, "elapsed_time": "4:15:10", "remaining_time": "0:57:16", "throughput": 2367.3, "total_tokens": 36243640} {"current_steps": 883, "total_steps": 1080, "loss": 0.0224, "lr": 3.993717294975863e-06, "epoch": 16.05504587155963, "percentage": 81.76, "elapsed_time": "4:15:27", "remaining_time": "0:56:59", "throughput": 2367.29, "total_tokens": 36285344} {"current_steps": 884, "total_steps": 1080, "loss": 0.0264, "lr": 3.954376535118562e-06, "epoch": 16.073394495412845, "percentage": 81.85, "elapsed_time": "4:15:41", "remaining_time": "0:56:41", "throughput": 2367.22, "total_tokens": 36316512} {"current_steps": 885, "total_steps": 1080, "loss": 0.0182, "lr": 3.9152138546778625e-06, "epoch": 16.091743119266056, "percentage": 81.94, "elapsed_time": "4:15:56", "remaining_time": "0:56:23", "throughput": 2367.17, "total_tokens": 36351392} {"current_steps": 886, "total_steps": 1080, "loss": 0.0198, "lr": 3.876229585032245e-06, "epoch": 16.110091743119266, "percentage": 82.04, "elapsed_time": "4:16:10", "remaining_time": "0:56:05", "throughput": 2367.27, "total_tokens": 36385144} {"current_steps": 887, "total_steps": 1080, "loss": 0.0244, "lr": 3.837424056050598e-06, "epoch": 16.128440366972477, "percentage": 82.13, "elapsed_time": "4:16:25", "remaining_time": "0:55:47", "throughput": 2367.37, "total_tokens": 36423008} {"current_steps": 888, "total_steps": 1080, "loss": 0.0226, "lr": 3.798797596089351e-06, "epoch": 16.146788990825687, "percentage": 82.22, "elapsed_time": "4:16:38", "remaining_time": "0:55:29", "throughput": 2367.4, "total_tokens": 36454768} {"current_steps": 889, "total_steps": 1080, "loss": 0.0208, "lr": 3.760350531989737e-06, "epoch": 16.165137614678898, "percentage": 82.31, "elapsed_time": "4:16:58", "remaining_time": "0:55:12", "throughput": 2367.52, "total_tokens": 36503200} {"current_steps": 890, "total_steps": 1080, "loss": 0.0186, "lr": 3.7220831890750067e-06, "epoch": 16.18348623853211, "percentage": 82.41, "elapsed_time": "4:17:15", "remaining_time": "0:54:55", "throughput": 2367.56, "total_tokens": 36544752} {"current_steps": 891, "total_steps": 1080, "loss": 0.024, "lr": 3.6839958911476957e-06, "epoch": 16.201834862385322, "percentage": 82.5, "elapsed_time": "4:17:32", "remaining_time": "0:54:37", "throughput": 2367.79, "total_tokens": 36589352} {"current_steps": 892, "total_steps": 1080, "loss": 0.0244, "lr": 3.6460889604868626e-06, "epoch": 16.220183486238533, "percentage": 82.59, "elapsed_time": "4:17:46", "remaining_time": "0:54:19", "throughput": 2367.68, "total_tokens": 36619488} {"current_steps": 893, "total_steps": 1080, "loss": 0.023, "lr": 3.608362717845376e-06, "epoch": 16.238532110091743, "percentage": 82.69, "elapsed_time": "4:18:02", "remaining_time": "0:54:02", "throughput": 2367.81, "total_tokens": 36659792} {"current_steps": 894, "total_steps": 1080, "loss": 0.0185, "lr": 3.5708174824471947e-06, "epoch": 16.256880733944953, "percentage": 82.78, "elapsed_time": "4:18:20", "remaining_time": "0:53:44", "throughput": 2367.76, "total_tokens": 36700648} {"current_steps": 895, "total_steps": 1080, "loss": 0.0285, "lr": 3.5334535719846766e-06, "epoch": 16.275229357798164, "percentage": 82.87, "elapsed_time": "4:18:43", "remaining_time": "0:53:28", "throughput": 2367.77, "total_tokens": 36755856} {"current_steps": 896, "total_steps": 1080, "loss": 0.0204, "lr": 3.4962713026158694e-06, "epoch": 16.293577981651374, "percentage": 82.96, "elapsed_time": "4:18:57", "remaining_time": "0:53:10", "throughput": 2367.72, "total_tokens": 36788392} {"current_steps": 897, "total_steps": 1080, "loss": 0.0184, "lr": 3.4592709889618545e-06, "epoch": 16.31192660550459, "percentage": 83.06, "elapsed_time": "4:19:10", "remaining_time": "0:52:52", "throughput": 2367.82, "total_tokens": 36821312} {"current_steps": 898, "total_steps": 1080, "loss": 0.0332, "lr": 3.4224529441040904e-06, "epoch": 16.3302752293578, "percentage": 83.15, "elapsed_time": "4:19:29", "remaining_time": "0:52:35", "throughput": 2367.46, "total_tokens": 36859304} {"current_steps": 899, "total_steps": 1080, "loss": 0.0202, "lr": 3.3858174795817404e-06, "epoch": 16.34862385321101, "percentage": 83.24, "elapsed_time": "4:19:47", "remaining_time": "0:52:18", "throughput": 2367.59, "total_tokens": 36905288} {"current_steps": 900, "total_steps": 1080, "loss": 0.0207, "lr": 3.3493649053890326e-06, "epoch": 16.36697247706422, "percentage": 83.33, "elapsed_time": "4:20:08", "remaining_time": "0:52:01", "throughput": 2367.48, "total_tokens": 36951576} {"current_steps": 901, "total_steps": 1080, "loss": 0.02, "lr": 3.313095529972687e-06, "epoch": 16.38532110091743, "percentage": 83.43, "elapsed_time": "4:20:21", "remaining_time": "0:51:43", "throughput": 2367.52, "total_tokens": 36985192} {"current_steps": 902, "total_steps": 1080, "loss": 0.0232, "lr": 3.2770096602292465e-06, "epoch": 16.40366972477064, "percentage": 83.52, "elapsed_time": "4:20:39", "remaining_time": "0:51:26", "throughput": 2367.85, "total_tokens": 37031592} {"current_steps": 903, "total_steps": 1080, "loss": 0.0199, "lr": 3.2411076015025075e-06, "epoch": 16.422018348623855, "percentage": 83.61, "elapsed_time": "4:20:55", "remaining_time": "0:51:08", "throughput": 2367.91, "total_tokens": 37070832} {"current_steps": 904, "total_steps": 1080, "loss": 0.021, "lr": 3.205389657580943e-06, "epoch": 16.440366972477065, "percentage": 83.7, "elapsed_time": "4:21:08", "remaining_time": "0:50:50", "throughput": 2367.99, "total_tokens": 37103136} {"current_steps": 905, "total_steps": 1080, "loss": 0.0202, "lr": 3.1698561306951064e-06, "epoch": 16.458715596330276, "percentage": 83.8, "elapsed_time": "4:21:26", "remaining_time": "0:50:33", "throughput": 2368.25, "total_tokens": 37148584} {"current_steps": 906, "total_steps": 1080, "loss": 0.021, "lr": 3.1345073215151066e-06, "epoch": 16.477064220183486, "percentage": 83.89, "elapsed_time": "4:21:41", "remaining_time": "0:50:15", "throughput": 2368.34, "total_tokens": 37187096} {"current_steps": 907, "total_steps": 1080, "loss": 0.0201, "lr": 3.0993435291480355e-06, "epoch": 16.495412844036696, "percentage": 83.98, "elapsed_time": "4:21:57", "remaining_time": "0:49:57", "throughput": 2368.38, "total_tokens": 37225824} {"current_steps": 908, "total_steps": 1080, "loss": 0.0178, "lr": 3.0643650511354484e-06, "epoch": 16.513761467889907, "percentage": 84.07, "elapsed_time": "4:22:12", "remaining_time": "0:49:40", "throughput": 2368.46, "total_tokens": 37262480} {"current_steps": 909, "total_steps": 1080, "loss": 0.0173, "lr": 3.029572183450868e-06, "epoch": 16.53211009174312, "percentage": 84.17, "elapsed_time": "4:22:31", "remaining_time": "0:49:23", "throughput": 2368.34, "total_tokens": 37303856} {"current_steps": 910, "total_steps": 1080, "loss": 0.0178, "lr": 2.9949652204972254e-06, "epoch": 16.55045871559633, "percentage": 84.26, "elapsed_time": "4:22:48", "remaining_time": "0:49:05", "throughput": 2368.26, "total_tokens": 37342760} {"current_steps": 911, "total_steps": 1080, "loss": 0.018, "lr": 2.9605444551044166e-06, "epoch": 16.568807339449542, "percentage": 84.35, "elapsed_time": "4:23:06", "remaining_time": "0:48:48", "throughput": 2368.28, "total_tokens": 37388064} {"current_steps": 912, "total_steps": 1080, "loss": 0.0153, "lr": 2.9263101785268254e-06, "epoch": 16.587155963302752, "percentage": 84.44, "elapsed_time": "4:23:23", "remaining_time": "0:48:31", "throughput": 2368.4, "total_tokens": 37428768} {"current_steps": 913, "total_steps": 1080, "loss": 0.0203, "lr": 2.89226268044083e-06, "epoch": 16.605504587155963, "percentage": 84.54, "elapsed_time": "4:23:42", "remaining_time": "0:48:14", "throughput": 2368.44, "total_tokens": 37474624} {"current_steps": 914, "total_steps": 1080, "loss": 0.0187, "lr": 2.858402248942349e-06, "epoch": 16.623853211009173, "percentage": 84.63, "elapsed_time": "4:23:57", "remaining_time": "0:47:56", "throughput": 2368.49, "total_tokens": 37511824} {"current_steps": 915, "total_steps": 1080, "loss": 0.0191, "lr": 2.8247291705444575e-06, "epoch": 16.642201834862384, "percentage": 84.72, "elapsed_time": "4:24:13", "remaining_time": "0:47:38", "throughput": 2368.57, "total_tokens": 37550216} {"current_steps": 916, "total_steps": 1080, "loss": 0.017, "lr": 2.7912437301749026e-06, "epoch": 16.660550458715598, "percentage": 84.81, "elapsed_time": "4:24:35", "remaining_time": "0:47:22", "throughput": 2368.44, "total_tokens": 37600240} {"current_steps": 917, "total_steps": 1080, "loss": 0.0231, "lr": 2.7579462111737065e-06, "epoch": 16.678899082568808, "percentage": 84.91, "elapsed_time": "4:24:54", "remaining_time": "0:47:05", "throughput": 2368.32, "total_tokens": 37642608} {"current_steps": 918, "total_steps": 1080, "loss": 0.0227, "lr": 2.7248368952908053e-06, "epoch": 16.69724770642202, "percentage": 85.0, "elapsed_time": "4:25:11", "remaining_time": "0:46:47", "throughput": 2368.47, "total_tokens": 37684840} {"current_steps": 919, "total_steps": 1080, "loss": 0.0167, "lr": 2.6919160626836166e-06, "epoch": 16.71559633027523, "percentage": 85.09, "elapsed_time": "4:25:26", "remaining_time": "0:46:30", "throughput": 2368.27, "total_tokens": 37718968} {"current_steps": 920, "total_steps": 1080, "loss": 0.0307, "lr": 2.659183991914696e-06, "epoch": 16.73394495412844, "percentage": 85.19, "elapsed_time": "4:25:47", "remaining_time": "0:46:13", "throughput": 2368.23, "total_tokens": 37767744} {"current_steps": 921, "total_steps": 1080, "loss": 0.0219, "lr": 2.6266409599493753e-06, "epoch": 16.75229357798165, "percentage": 85.28, "elapsed_time": "4:26:08", "remaining_time": "0:45:56", "throughput": 2368.17, "total_tokens": 37815432} {"current_steps": 922, "total_steps": 1080, "loss": 0.0175, "lr": 2.5942872421534146e-06, "epoch": 16.770642201834864, "percentage": 85.37, "elapsed_time": "4:26:27", "remaining_time": "0:45:39", "throughput": 2368.15, "total_tokens": 37859656} {"current_steps": 923, "total_steps": 1080, "loss": 0.0212, "lr": 2.5621231122906873e-06, "epoch": 16.788990825688074, "percentage": 85.46, "elapsed_time": "4:26:39", "remaining_time": "0:45:21", "throughput": 2368.27, "total_tokens": 37891816} {"current_steps": 924, "total_steps": 1080, "loss": 0.0205, "lr": 2.5301488425208296e-06, "epoch": 16.807339449541285, "percentage": 85.56, "elapsed_time": "4:26:56", "remaining_time": "0:45:04", "throughput": 2368.21, "total_tokens": 37930184} {"current_steps": 925, "total_steps": 1080, "loss": 0.0332, "lr": 2.4983647033969714e-06, "epoch": 16.825688073394495, "percentage": 85.65, "elapsed_time": "4:27:20", "remaining_time": "0:44:47", "throughput": 2367.9, "total_tokens": 37982736} {"current_steps": 926, "total_steps": 1080, "loss": 0.0177, "lr": 2.4667709638634434e-06, "epoch": 16.844036697247706, "percentage": 85.74, "elapsed_time": "4:27:36", "remaining_time": "0:44:30", "throughput": 2368.0, "total_tokens": 38022992} {"current_steps": 927, "total_steps": 1080, "loss": 0.0187, "lr": 2.43536789125349e-06, "epoch": 16.862385321100916, "percentage": 85.83, "elapsed_time": "4:27:55", "remaining_time": "0:44:13", "throughput": 2368.2, "total_tokens": 38070776} {"current_steps": 928, "total_steps": 1080, "loss": 0.0266, "lr": 2.4041557512869878e-06, "epoch": 16.88073394495413, "percentage": 85.93, "elapsed_time": "4:28:18", "remaining_time": "0:43:56", "throughput": 2368.1, "total_tokens": 38122544} {"current_steps": 929, "total_steps": 1080, "loss": 0.0179, "lr": 2.3731348080682504e-06, "epoch": 16.89908256880734, "percentage": 86.02, "elapsed_time": "4:28:33", "remaining_time": "0:43:39", "throughput": 2368.21, "total_tokens": 38160680} {"current_steps": 930, "total_steps": 1080, "loss": 0.0176, "lr": 2.3423053240837515e-06, "epoch": 16.91743119266055, "percentage": 86.11, "elapsed_time": "4:28:51", "remaining_time": "0:43:21", "throughput": 2368.12, "total_tokens": 38200720} {"current_steps": 931, "total_steps": 1080, "loss": 0.0196, "lr": 2.3116675601999094e-06, "epoch": 16.93577981651376, "percentage": 86.2, "elapsed_time": "4:29:05", "remaining_time": "0:43:04", "throughput": 2368.41, "total_tokens": 38240296} {"current_steps": 932, "total_steps": 1080, "loss": 0.0275, "lr": 2.281221775660894e-06, "epoch": 16.954128440366972, "percentage": 86.3, "elapsed_time": "4:29:35", "remaining_time": "0:42:48", "throughput": 2367.81, "total_tokens": 38299672} {"current_steps": 933, "total_steps": 1080, "loss": 0.02, "lr": 2.2509682280864224e-06, "epoch": 16.972477064220183, "percentage": 86.39, "elapsed_time": "4:29:57", "remaining_time": "0:42:31", "throughput": 2367.72, "total_tokens": 38350408} {"current_steps": 934, "total_steps": 1080, "loss": 0.0179, "lr": 2.2209071734695746e-06, "epoch": 16.990825688073393, "percentage": 86.48, "elapsed_time": "4:30:12", "remaining_time": "0:42:14", "throughput": 2367.7, "total_tokens": 38386312} {"current_steps": 935, "total_steps": 1080, "loss": 0.0217, "lr": 2.1910388661746493e-06, "epoch": 17.0, "percentage": 86.57, "elapsed_time": "4:30:19", "remaining_time": "0:41:55", "throughput": 2367.82, "total_tokens": 38404496} {"current_steps": 936, "total_steps": 1080, "loss": 0.0216, "lr": 2.1613635589349756e-06, "epoch": 17.01834862385321, "percentage": 86.67, "elapsed_time": "4:30:34", "remaining_time": "0:41:37", "throughput": 2367.83, "total_tokens": 38440632} {"current_steps": 937, "total_steps": 1080, "loss": 0.0149, "lr": 2.131881502850824e-06, "epoch": 17.03669724770642, "percentage": 86.76, "elapsed_time": "4:30:51", "remaining_time": "0:41:20", "throughput": 2367.72, "total_tokens": 38480008} {"current_steps": 938, "total_steps": 1080, "loss": 0.0205, "lr": 2.1025929473872274e-06, "epoch": 17.05504587155963, "percentage": 86.85, "elapsed_time": "4:31:09", "remaining_time": "0:41:02", "throughput": 2367.82, "total_tokens": 38523112} {"current_steps": 939, "total_steps": 1080, "loss": 0.025, "lr": 2.073498140371899e-06, "epoch": 17.073394495412845, "percentage": 86.94, "elapsed_time": "4:31:27", "remaining_time": "0:40:45", "throughput": 2367.77, "total_tokens": 38564512} {"current_steps": 940, "total_steps": 1080, "loss": 0.0269, "lr": 2.044597327993153e-06, "epoch": 17.091743119266056, "percentage": 87.04, "elapsed_time": "4:31:41", "remaining_time": "0:40:27", "throughput": 2367.67, "total_tokens": 38595896} {"current_steps": 941, "total_steps": 1080, "loss": 0.0183, "lr": 2.0158907547977722e-06, "epoch": 17.110091743119266, "percentage": 87.13, "elapsed_time": "4:31:53", "remaining_time": "0:40:09", "throughput": 2367.83, "total_tokens": 38628184} {"current_steps": 942, "total_steps": 1080, "loss": 0.0283, "lr": 1.9873786636889906e-06, "epoch": 17.128440366972477, "percentage": 87.22, "elapsed_time": "4:32:12", "remaining_time": "0:39:52", "throughput": 2367.56, "total_tokens": 38667296} {"current_steps": 943, "total_steps": 1080, "loss": 0.0135, "lr": 1.9590612959244055e-06, "epoch": 17.146788990825687, "percentage": 87.31, "elapsed_time": "4:32:27", "remaining_time": "0:39:35", "throughput": 2367.72, "total_tokens": 38707024} {"current_steps": 944, "total_steps": 1080, "loss": 0.0242, "lr": 1.9309388911139426e-06, "epoch": 17.165137614678898, "percentage": 87.41, "elapsed_time": "4:32:44", "remaining_time": "0:39:17", "throughput": 2367.83, "total_tokens": 38748056} {"current_steps": 945, "total_steps": 1080, "loss": 0.0166, "lr": 1.9030116872178316e-06, "epoch": 17.18348623853211, "percentage": 87.5, "elapsed_time": "4:33:00", "remaining_time": "0:39:00", "throughput": 2367.88, "total_tokens": 38786744} {"current_steps": 946, "total_steps": 1080, "loss": 0.0219, "lr": 1.8752799205445982e-06, "epoch": 17.201834862385322, "percentage": 87.59, "elapsed_time": "4:33:23", "remaining_time": "0:38:43", "throughput": 2367.84, "total_tokens": 38840712} {"current_steps": 947, "total_steps": 1080, "loss": 0.0189, "lr": 1.8477438257490543e-06, "epoch": 17.220183486238533, "percentage": 87.69, "elapsed_time": "4:33:35", "remaining_time": "0:38:25", "throughput": 2367.88, "total_tokens": 38871016} {"current_steps": 948, "total_steps": 1080, "loss": 0.0141, "lr": 1.8204036358303173e-06, "epoch": 17.238532110091743, "percentage": 87.78, "elapsed_time": "4:33:55", "remaining_time": "0:38:08", "throughput": 2368.05, "total_tokens": 38919976} {"current_steps": 949, "total_steps": 1080, "loss": 0.0145, "lr": 1.793259582129836e-06, "epoch": 17.256880733944953, "percentage": 87.87, "elapsed_time": "4:34:15", "remaining_time": "0:37:51", "throughput": 2368.36, "total_tokens": 38973000} {"current_steps": 950, "total_steps": 1080, "loss": 0.0195, "lr": 1.7663118943294366e-06, "epoch": 17.275229357798164, "percentage": 87.96, "elapsed_time": "4:34:39", "remaining_time": "0:37:35", "throughput": 2368.26, "total_tokens": 39027080} {"current_steps": 951, "total_steps": 1080, "loss": 0.0214, "lr": 1.7395608004493886e-06, "epoch": 17.293577981651374, "percentage": 88.06, "elapsed_time": "4:34:51", "remaining_time": "0:37:16", "throughput": 2368.29, "total_tokens": 39055792} {"current_steps": 952, "total_steps": 1080, "loss": 0.0212, "lr": 1.713006526846439e-06, "epoch": 17.31192660550459, "percentage": 88.15, "elapsed_time": "4:35:13", "remaining_time": "0:37:00", "throughput": 2368.35, "total_tokens": 39108640} {"current_steps": 953, "total_steps": 1080, "loss": 0.0225, "lr": 1.686649298211951e-06, "epoch": 17.3302752293578, "percentage": 88.24, "elapsed_time": "4:35:33", "remaining_time": "0:36:43", "throughput": 2368.08, "total_tokens": 39152080} {"current_steps": 954, "total_steps": 1080, "loss": 0.0148, "lr": 1.6604893375699594e-06, "epoch": 17.34862385321101, "percentage": 88.33, "elapsed_time": "4:35:52", "remaining_time": "0:36:26", "throughput": 2368.2, "total_tokens": 39199992} {"current_steps": 955, "total_steps": 1080, "loss": 0.019, "lr": 1.6345268662752906e-06, "epoch": 17.36697247706422, "percentage": 88.43, "elapsed_time": "4:36:07", "remaining_time": "0:36:08", "throughput": 2368.44, "total_tokens": 39239008} {"current_steps": 956, "total_steps": 1080, "loss": 0.0187, "lr": 1.6087621040117157e-06, "epoch": 17.38532110091743, "percentage": 88.52, "elapsed_time": "4:36:22", "remaining_time": "0:35:50", "throughput": 2368.41, "total_tokens": 39274760} {"current_steps": 957, "total_steps": 1080, "loss": 0.0191, "lr": 1.5831952687900608e-06, "epoch": 17.40366972477064, "percentage": 88.61, "elapsed_time": "4:36:36", "remaining_time": "0:35:33", "throughput": 2368.37, "total_tokens": 39306592} {"current_steps": 958, "total_steps": 1080, "loss": 0.0192, "lr": 1.5578265769463806e-06, "epoch": 17.422018348623855, "percentage": 88.7, "elapsed_time": "4:36:50", "remaining_time": "0:35:15", "throughput": 2368.56, "total_tokens": 39343144} {"current_steps": 959, "total_steps": 1080, "loss": 0.0205, "lr": 1.5326562431401153e-06, "epoch": 17.440366972477065, "percentage": 88.8, "elapsed_time": "4:37:08", "remaining_time": "0:34:58", "throughput": 2368.26, "total_tokens": 39381656} {"current_steps": 960, "total_steps": 1080, "loss": 0.021, "lr": 1.5076844803522922e-06, "epoch": 17.458715596330276, "percentage": 88.89, "elapsed_time": "4:37:26", "remaining_time": "0:34:40", "throughput": 2368.13, "total_tokens": 39421896} {"current_steps": 961, "total_steps": 1080, "loss": 0.0214, "lr": 1.482911499883699e-06, "epoch": 17.477064220183486, "percentage": 88.98, "elapsed_time": "4:37:40", "remaining_time": "0:34:23", "throughput": 2368.37, "total_tokens": 39459352} {"current_steps": 962, "total_steps": 1080, "loss": 0.0146, "lr": 1.4583375113531195e-06, "epoch": 17.495412844036696, "percentage": 89.07, "elapsed_time": "4:37:54", "remaining_time": "0:34:05", "throughput": 2368.49, "total_tokens": 39492800} {"current_steps": 963, "total_steps": 1080, "loss": 0.0165, "lr": 1.4339627226955392e-06, "epoch": 17.513761467889907, "percentage": 89.17, "elapsed_time": "4:38:12", "remaining_time": "0:33:48", "throughput": 2368.55, "total_tokens": 39537000} {"current_steps": 964, "total_steps": 1080, "loss": 0.0232, "lr": 1.4097873401604122e-06, "epoch": 17.53211009174312, "percentage": 89.26, "elapsed_time": "4:38:27", "remaining_time": "0:33:30", "throughput": 2368.75, "total_tokens": 39576288} {"current_steps": 965, "total_steps": 1080, "loss": 0.0142, "lr": 1.3858115683098832e-06, "epoch": 17.55045871559633, "percentage": 89.35, "elapsed_time": "4:38:42", "remaining_time": "0:33:12", "throughput": 2368.84, "total_tokens": 39612936} {"current_steps": 966, "total_steps": 1080, "loss": 0.0202, "lr": 1.362035610017079e-06, "epoch": 17.568807339449542, "percentage": 89.44, "elapsed_time": "4:38:57", "remaining_time": "0:32:55", "throughput": 2369.07, "total_tokens": 39651632} {"current_steps": 967, "total_steps": 1080, "loss": 0.0201, "lr": 1.3384596664643922e-06, "epoch": 17.587155963302752, "percentage": 89.54, "elapsed_time": "4:39:24", "remaining_time": "0:32:39", "throughput": 2368.92, "total_tokens": 39713824} {"current_steps": 968, "total_steps": 1080, "loss": 0.0169, "lr": 1.31508393714177e-06, "epoch": 17.605504587155963, "percentage": 89.63, "elapsed_time": "4:39:41", "remaining_time": "0:32:21", "throughput": 2368.94, "total_tokens": 39753616} {"current_steps": 969, "total_steps": 1080, "loss": 0.0284, "lr": 1.291908619845017e-06, "epoch": 17.623853211009173, "percentage": 89.72, "elapsed_time": "4:39:55", "remaining_time": "0:32:03", "throughput": 2369.04, "total_tokens": 39789208} {"current_steps": 970, "total_steps": 1080, "loss": 0.0219, "lr": 1.2689339106741527e-06, "epoch": 17.642201834862384, "percentage": 89.81, "elapsed_time": "4:40:09", "remaining_time": "0:31:46", "throughput": 2369.14, "total_tokens": 39823072} {"current_steps": 971, "total_steps": 1080, "loss": 0.0221, "lr": 1.2461600040317212e-06, "epoch": 17.660550458715598, "percentage": 89.91, "elapsed_time": "4:40:21", "remaining_time": "0:31:28", "throughput": 2369.18, "total_tokens": 39853600} {"current_steps": 972, "total_steps": 1080, "loss": 0.0203, "lr": 1.2235870926211619e-06, "epoch": 17.678899082568808, "percentage": 90.0, "elapsed_time": "4:40:35", "remaining_time": "0:31:10", "throughput": 2369.39, "total_tokens": 39890080} {"current_steps": 973, "total_steps": 1080, "loss": 0.0258, "lr": 1.2012153674451715e-06, "epoch": 17.69724770642202, "percentage": 90.09, "elapsed_time": "4:40:53", "remaining_time": "0:30:53", "throughput": 2369.19, "total_tokens": 39929208} {"current_steps": 974, "total_steps": 1080, "loss": 0.0212, "lr": 1.1790450178040951e-06, "epoch": 17.71559633027523, "percentage": 90.19, "elapsed_time": "4:41:10", "remaining_time": "0:30:35", "throughput": 2369.2, "total_tokens": 39969344} {"current_steps": 975, "total_steps": 1080, "loss": 0.0188, "lr": 1.1570762312943295e-06, "epoch": 17.73394495412844, "percentage": 90.28, "elapsed_time": "4:41:26", "remaining_time": "0:30:18", "throughput": 2369.54, "total_tokens": 40012816} {"current_steps": 976, "total_steps": 1080, "loss": 0.0215, "lr": 1.1353091938067023e-06, "epoch": 17.75229357798165, "percentage": 90.37, "elapsed_time": "4:41:42", "remaining_time": "0:30:01", "throughput": 2369.58, "total_tokens": 40051096} {"current_steps": 977, "total_steps": 1080, "loss": 0.0173, "lr": 1.1137440895249457e-06, "epoch": 17.770642201834864, "percentage": 90.46, "elapsed_time": "4:41:56", "remaining_time": "0:29:43", "throughput": 2369.84, "total_tokens": 40090488} {"current_steps": 978, "total_steps": 1080, "loss": 0.0203, "lr": 1.0923811009241142e-06, "epoch": 17.788990825688074, "percentage": 90.56, "elapsed_time": "4:42:20", "remaining_time": "0:29:26", "throughput": 2369.83, "total_tokens": 40145176} {"current_steps": 979, "total_steps": 1080, "loss": 0.0246, "lr": 1.071220408769033e-06, "epoch": 17.807339449541285, "percentage": 90.65, "elapsed_time": "4:42:39", "remaining_time": "0:29:09", "throughput": 2369.74, "total_tokens": 40189416} {"current_steps": 980, "total_steps": 1080, "loss": 0.014, "lr": 1.0502621921127776e-06, "epoch": 17.825688073394495, "percentage": 90.74, "elapsed_time": "4:42:57", "remaining_time": "0:28:52", "throughput": 2370.1, "total_tokens": 40239272} {"current_steps": 981, "total_steps": 1080, "loss": 0.0239, "lr": 1.0295066282951738e-06, "epoch": 17.844036697247706, "percentage": 90.83, "elapsed_time": "4:43:20", "remaining_time": "0:28:35", "throughput": 2369.76, "total_tokens": 40288104} {"current_steps": 982, "total_steps": 1080, "loss": 0.0168, "lr": 1.0089538929412724e-06, "epoch": 17.862385321100916, "percentage": 90.93, "elapsed_time": "4:43:35", "remaining_time": "0:28:18", "throughput": 2369.71, "total_tokens": 40322904} {"current_steps": 983, "total_steps": 1080, "loss": 0.0169, "lr": 9.886041599598606e-07, "epoch": 17.88073394495413, "percentage": 91.02, "elapsed_time": "4:43:59", "remaining_time": "0:28:01", "throughput": 2369.33, "total_tokens": 40372536} {"current_steps": 984, "total_steps": 1080, "loss": 0.0188, "lr": 9.684576015420278e-07, "epoch": 17.89908256880734, "percentage": 91.11, "elapsed_time": "4:44:22", "remaining_time": "0:27:44", "throughput": 2369.43, "total_tokens": 40427408} {"current_steps": 985, "total_steps": 1080, "loss": 0.0238, "lr": 9.485143881596714e-07, "epoch": 17.91743119266055, "percentage": 91.2, "elapsed_time": "4:44:44", "remaining_time": "0:27:27", "throughput": 2369.28, "total_tokens": 40477568} {"current_steps": 986, "total_steps": 1080, "loss": 0.0215, "lr": 9.287746885640603e-07, "epoch": 17.93577981651376, "percentage": 91.3, "elapsed_time": "4:44:59", "remaining_time": "0:27:10", "throughput": 2369.59, "total_tokens": 40519224} {"current_steps": 987, "total_steps": 1080, "loss": 0.0188, "lr": 9.092386697844263e-07, "epoch": 17.954128440366972, "percentage": 91.39, "elapsed_time": "4:45:15", "remaining_time": "0:26:52", "throughput": 2369.81, "total_tokens": 40560640} {"current_steps": 988, "total_steps": 1080, "loss": 0.029, "lr": 8.899064971265276e-07, "epoch": 17.972477064220183, "percentage": 91.48, "elapsed_time": "4:45:37", "remaining_time": "0:26:35", "throughput": 2369.63, "total_tokens": 40609544} {"current_steps": 989, "total_steps": 1080, "loss": 0.0173, "lr": 8.707783341712656e-07, "epoch": 17.990825688073393, "percentage": 91.57, "elapsed_time": "4:45:52", "remaining_time": "0:26:18", "throughput": 2369.76, "total_tokens": 40646216} {"current_steps": 990, "total_steps": 1080, "loss": 0.0252, "lr": 8.51854342773295e-07, "epoch": 18.0, "percentage": 91.67, "elapsed_time": "4:45:59", "remaining_time": "0:25:59", "throughput": 2369.81, "total_tokens": 40663584} {"current_steps": 991, "total_steps": 1080, "loss": 0.0136, "lr": 8.331346830596498e-07, "epoch": 18.01834862385321, "percentage": 91.76, "elapsed_time": "4:46:18", "remaining_time": "0:25:42", "throughput": 2369.88, "total_tokens": 40711208} {"current_steps": 992, "total_steps": 1080, "loss": 0.0163, "lr": 8.146195134284052e-07, "epoch": 18.03669724770642, "percentage": 91.85, "elapsed_time": "4:46:34", "remaining_time": "0:25:25", "throughput": 2370.08, "total_tokens": 40752144} {"current_steps": 993, "total_steps": 1080, "loss": 0.0204, "lr": 7.963089905473092e-07, "epoch": 18.05504587155963, "percentage": 91.94, "elapsed_time": "4:46:54", "remaining_time": "0:25:08", "throughput": 2370.04, "total_tokens": 40798560} {"current_steps": 994, "total_steps": 1080, "loss": 0.0196, "lr": 7.782032693524816e-07, "epoch": 18.073394495412845, "percentage": 92.04, "elapsed_time": "4:47:07", "remaining_time": "0:24:50", "throughput": 2369.99, "total_tokens": 40829872} {"current_steps": 995, "total_steps": 1080, "loss": 0.0225, "lr": 7.603025030471e-07, "epoch": 18.091743119266056, "percentage": 92.13, "elapsed_time": "4:47:24", "remaining_time": "0:24:33", "throughput": 2369.88, "total_tokens": 40866712} {"current_steps": 996, "total_steps": 1080, "loss": 0.0152, "lr": 7.426068431000882e-07, "epoch": 18.110091743119266, "percentage": 92.22, "elapsed_time": "4:47:45", "remaining_time": "0:24:16", "throughput": 2369.84, "total_tokens": 40917200} {"current_steps": 997, "total_steps": 1080, "loss": 0.0176, "lr": 7.251164392448496e-07, "epoch": 18.128440366972477, "percentage": 92.31, "elapsed_time": "4:48:04", "remaining_time": "0:23:58", "throughput": 2369.9, "total_tokens": 40961592} {"current_steps": 998, "total_steps": 1080, "loss": 0.0215, "lr": 7.078314394779961e-07, "epoch": 18.146788990825687, "percentage": 92.41, "elapsed_time": "4:48:20", "remaining_time": "0:23:41", "throughput": 2369.73, "total_tokens": 40996304} {"current_steps": 999, "total_steps": 1080, "loss": 0.0196, "lr": 6.907519900580861e-07, "epoch": 18.165137614678898, "percentage": 92.5, "elapsed_time": "4:48:47", "remaining_time": "0:23:24", "throughput": 2369.26, "total_tokens": 41054400} {"current_steps": 1000, "total_steps": 1080, "loss": 0.0189, "lr": 6.738782355044049e-07, "epoch": 18.18348623853211, "percentage": 92.59, "elapsed_time": "4:49:11", "remaining_time": "0:23:08", "throughput": 2369.07, "total_tokens": 41106064} {"current_steps": 1001, "total_steps": 1080, "loss": 0.0186, "lr": 6.572103185957301e-07, "epoch": 18.201834862385322, "percentage": 92.69, "elapsed_time": "4:49:28", "remaining_time": "0:22:50", "throughput": 2369.22, "total_tokens": 41148920} {"current_steps": 1002, "total_steps": 1080, "loss": 0.022, "lr": 6.407483803691216e-07, "epoch": 18.220183486238533, "percentage": 92.78, "elapsed_time": "4:49:40", "remaining_time": "0:22:33", "throughput": 2369.07, "total_tokens": 41176536} {"current_steps": 1003, "total_steps": 1080, "loss": 0.0183, "lr": 6.244925601187363e-07, "epoch": 18.238532110091743, "percentage": 92.87, "elapsed_time": "4:49:59", "remaining_time": "0:22:15", "throughput": 2369.26, "total_tokens": 41223776} {"current_steps": 1004, "total_steps": 1080, "loss": 0.0182, "lr": 6.084429953946452e-07, "epoch": 18.256880733944953, "percentage": 92.96, "elapsed_time": "4:50:21", "remaining_time": "0:21:58", "throughput": 2369.13, "total_tokens": 41274976} {"current_steps": 1005, "total_steps": 1080, "loss": 0.0273, "lr": 5.925998220016659e-07, "epoch": 18.275229357798164, "percentage": 93.06, "elapsed_time": "4:50:33", "remaining_time": "0:21:41", "throughput": 2369.04, "total_tokens": 41300896} {"current_steps": 1006, "total_steps": 1080, "loss": 0.0153, "lr": 5.769631739982267e-07, "epoch": 18.293577981651374, "percentage": 93.15, "elapsed_time": "4:50:49", "remaining_time": "0:21:23", "throughput": 2369.01, "total_tokens": 41338840} {"current_steps": 1007, "total_steps": 1080, "loss": 0.0172, "lr": 5.615331836952121e-07, "epoch": 18.31192660550459, "percentage": 93.24, "elapsed_time": "4:51:06", "remaining_time": "0:21:06", "throughput": 2368.81, "total_tokens": 41374664} {"current_steps": 1008, "total_steps": 1080, "loss": 0.0141, "lr": 5.463099816548579e-07, "epoch": 18.3302752293578, "percentage": 93.33, "elapsed_time": "4:51:21", "remaining_time": "0:20:48", "throughput": 2368.98, "total_tokens": 41413920} {"current_steps": 1009, "total_steps": 1080, "loss": 0.0343, "lr": 5.312936966896498e-07, "epoch": 18.34862385321101, "percentage": 93.43, "elapsed_time": "4:51:42", "remaining_time": "0:20:31", "throughput": 2368.87, "total_tokens": 41461272} {"current_steps": 1010, "total_steps": 1080, "loss": 0.0217, "lr": 5.164844558612131e-07, "epoch": 18.36697247706422, "percentage": 93.52, "elapsed_time": "4:51:59", "remaining_time": "0:20:14", "throughput": 2368.93, "total_tokens": 41501328} {"current_steps": 1011, "total_steps": 1080, "loss": 0.0208, "lr": 5.018823844792603e-07, "epoch": 18.38532110091743, "percentage": 93.61, "elapsed_time": "4:52:12", "remaining_time": "0:19:56", "throughput": 2368.98, "total_tokens": 41534096} {"current_steps": 1012, "total_steps": 1080, "loss": 0.0189, "lr": 4.874876061005173e-07, "epoch": 18.40366972477064, "percentage": 93.7, "elapsed_time": "4:52:30", "remaining_time": "0:19:39", "throughput": 2369.02, "total_tokens": 41576592} {"current_steps": 1013, "total_steps": 1080, "loss": 0.0128, "lr": 4.7330024252768555e-07, "epoch": 18.422018348623855, "percentage": 93.8, "elapsed_time": "4:52:50", "remaining_time": "0:19:22", "throughput": 2368.99, "total_tokens": 41624000} {"current_steps": 1014, "total_steps": 1080, "loss": 0.0231, "lr": 4.5932041380840065e-07, "epoch": 18.440366972477065, "percentage": 93.89, "elapsed_time": "4:53:03", "remaining_time": "0:19:04", "throughput": 2369.01, "total_tokens": 41656024} {"current_steps": 1015, "total_steps": 1080, "loss": 0.0154, "lr": 4.4554823823423354e-07, "epoch": 18.458715596330276, "percentage": 93.98, "elapsed_time": "4:53:22", "remaining_time": "0:18:47", "throughput": 2368.88, "total_tokens": 41697984} {"current_steps": 1016, "total_steps": 1080, "loss": 0.0169, "lr": 4.319838323396691e-07, "epoch": 18.477064220183486, "percentage": 94.07, "elapsed_time": "4:53:39", "remaining_time": "0:18:29", "throughput": 2369.01, "total_tokens": 41740560} {"current_steps": 1017, "total_steps": 1080, "loss": 0.0179, "lr": 4.1862731090113736e-07, "epoch": 18.495412844036696, "percentage": 94.17, "elapsed_time": "4:53:57", "remaining_time": "0:18:12", "throughput": 2369.05, "total_tokens": 41783512} {"current_steps": 1018, "total_steps": 1080, "loss": 0.018, "lr": 4.05478786936031e-07, "epoch": 18.513761467889907, "percentage": 94.26, "elapsed_time": "4:54:13", "remaining_time": "0:17:55", "throughput": 2369.08, "total_tokens": 41822144} {"current_steps": 1019, "total_steps": 1080, "loss": 0.0157, "lr": 3.9253837170175887e-07, "epoch": 18.53211009174312, "percentage": 94.35, "elapsed_time": "4:54:29", "remaining_time": "0:17:37", "throughput": 2369.14, "total_tokens": 41860344} {"current_steps": 1020, "total_steps": 1080, "loss": 0.0278, "lr": 3.7980617469479953e-07, "epoch": 18.55045871559633, "percentage": 94.44, "elapsed_time": "4:54:52", "remaining_time": "0:17:20", "throughput": 2369.16, "total_tokens": 41915536} {"current_steps": 1021, "total_steps": 1080, "loss": 0.0179, "lr": 3.672823036497658e-07, "epoch": 18.568807339449542, "percentage": 94.54, "elapsed_time": "4:55:10", "remaining_time": "0:17:03", "throughput": 2369.21, "total_tokens": 41961056} {"current_steps": 1022, "total_steps": 1080, "loss": 0.0203, "lr": 3.5496686453850846e-07, "epoch": 18.587155963302752, "percentage": 94.63, "elapsed_time": "4:55:27", "remaining_time": "0:16:46", "throughput": 2369.14, "total_tokens": 41998240} {"current_steps": 1023, "total_steps": 1080, "loss": 0.0176, "lr": 3.428599615692141e-07, "epoch": 18.605504587155963, "percentage": 94.72, "elapsed_time": "4:55:42", "remaining_time": "0:16:28", "throughput": 2369.07, "total_tokens": 42032136} {"current_steps": 1024, "total_steps": 1080, "loss": 0.0185, "lr": 3.309616971855195e-07, "epoch": 18.623853211009173, "percentage": 94.81, "elapsed_time": "4:56:01", "remaining_time": "0:16:11", "throughput": 2369.23, "total_tokens": 42079960} {"current_steps": 1025, "total_steps": 1080, "loss": 0.0148, "lr": 3.192721720656489e-07, "epoch": 18.642201834862384, "percentage": 94.91, "elapsed_time": "4:56:17", "remaining_time": "0:15:53", "throughput": 2369.32, "total_tokens": 42120432} {"current_steps": 1026, "total_steps": 1080, "loss": 0.0224, "lr": 3.077914851215585e-07, "epoch": 18.660550458715598, "percentage": 95.0, "elapsed_time": "4:56:37", "remaining_time": "0:15:36", "throughput": 2369.45, "total_tokens": 42171464} {"current_steps": 1027, "total_steps": 1080, "loss": 0.0231, "lr": 2.965197334981018e-07, "epoch": 18.678899082568808, "percentage": 95.09, "elapsed_time": "4:56:56", "remaining_time": "0:15:19", "throughput": 2369.42, "total_tokens": 42213608} {"current_steps": 1028, "total_steps": 1080, "loss": 0.0167, "lr": 2.8545701257221e-07, "epoch": 18.69724770642202, "percentage": 95.19, "elapsed_time": "4:57:13", "remaining_time": "0:15:02", "throughput": 2369.46, "total_tokens": 42255512} {"current_steps": 1029, "total_steps": 1080, "loss": 0.0202, "lr": 2.746034159520794e-07, "epoch": 18.71559633027523, "percentage": 95.28, "elapsed_time": "4:57:29", "remaining_time": "0:14:44", "throughput": 2369.39, "total_tokens": 42292752} {"current_steps": 1030, "total_steps": 1080, "loss": 0.0209, "lr": 2.6395903547638825e-07, "epoch": 18.73394495412844, "percentage": 95.37, "elapsed_time": "4:57:41", "remaining_time": "0:14:27", "throughput": 2369.47, "total_tokens": 42323392} {"current_steps": 1031, "total_steps": 1080, "loss": 0.0222, "lr": 2.5352396121350596e-07, "epoch": 18.75229357798165, "percentage": 95.46, "elapsed_time": "4:57:58", "remaining_time": "0:14:09", "throughput": 2369.61, "total_tokens": 42364656} {"current_steps": 1032, "total_steps": 1080, "loss": 0.0244, "lr": 2.4329828146074095e-07, "epoch": 18.770642201834864, "percentage": 95.56, "elapsed_time": "4:58:19", "remaining_time": "0:13:52", "throughput": 2369.14, "total_tokens": 42406144} {"current_steps": 1033, "total_steps": 1080, "loss": 0.0154, "lr": 2.3328208274359942e-07, "epoch": 18.788990825688074, "percentage": 95.65, "elapsed_time": "4:58:37", "remaining_time": "0:13:35", "throughput": 2369.27, "total_tokens": 42451744} {"current_steps": 1034, "total_steps": 1080, "loss": 0.022, "lr": 2.234754498150332e-07, "epoch": 18.807339449541285, "percentage": 95.74, "elapsed_time": "4:59:00", "remaining_time": "0:13:18", "throughput": 2369.45, "total_tokens": 42508464} {"current_steps": 1035, "total_steps": 1080, "loss": 0.0182, "lr": 2.1387846565474045e-07, "epoch": 18.825688073394495, "percentage": 95.83, "elapsed_time": "4:59:15", "remaining_time": "0:13:00", "throughput": 2369.55, "total_tokens": 42545880} {"current_steps": 1036, "total_steps": 1080, "loss": 0.023, "lr": 2.0449121146845774e-07, "epoch": 18.844036697247706, "percentage": 95.93, "elapsed_time": "4:59:35", "remaining_time": "0:12:43", "throughput": 2369.67, "total_tokens": 42596632} {"current_steps": 1037, "total_steps": 1080, "loss": 0.021, "lr": 1.9531376668727176e-07, "epoch": 18.862385321100916, "percentage": 96.02, "elapsed_time": "4:59:51", "remaining_time": "0:12:26", "throughput": 2369.73, "total_tokens": 42634536} {"current_steps": 1038, "total_steps": 1080, "loss": 0.0275, "lr": 1.8634620896695043e-07, "epoch": 18.88073394495413, "percentage": 96.11, "elapsed_time": "5:00:04", "remaining_time": "0:12:08", "throughput": 2369.87, "total_tokens": 42667304} {"current_steps": 1039, "total_steps": 1080, "loss": 0.0229, "lr": 1.7758861418727678e-07, "epoch": 18.89908256880734, "percentage": 96.2, "elapsed_time": "5:00:24", "remaining_time": "0:11:51", "throughput": 2369.82, "total_tokens": 42714696} {"current_steps": 1040, "total_steps": 1080, "loss": 0.0265, "lr": 1.6904105645142444e-07, "epoch": 18.91743119266055, "percentage": 96.3, "elapsed_time": "5:00:44", "remaining_time": "0:11:34", "throughput": 2369.76, "total_tokens": 42761616} {"current_steps": 1041, "total_steps": 1080, "loss": 0.0203, "lr": 1.607036080853136e-07, "epoch": 18.93577981651376, "percentage": 96.39, "elapsed_time": "5:00:59", "remaining_time": "0:11:16", "throughput": 2369.82, "total_tokens": 42797176} {"current_steps": 1042, "total_steps": 1080, "loss": 0.0218, "lr": 1.5257633963700058e-07, "epoch": 18.954128440366972, "percentage": 96.48, "elapsed_time": "5:01:14", "remaining_time": "0:10:59", "throughput": 2369.94, "total_tokens": 42836136} {"current_steps": 1043, "total_steps": 1080, "loss": 0.015, "lr": 1.4465931987609482e-07, "epoch": 18.972477064220183, "percentage": 96.57, "elapsed_time": "5:01:24", "remaining_time": "0:10:41", "throughput": 2369.94, "total_tokens": 42860296} {"current_steps": 1044, "total_steps": 1080, "loss": 0.0181, "lr": 1.3695261579316777e-07, "epoch": 18.990825688073393, "percentage": 96.67, "elapsed_time": "5:01:41", "remaining_time": "0:10:24", "throughput": 2370.05, "total_tokens": 42901256} {"current_steps": 1045, "total_steps": 1080, "loss": 0.0173, "lr": 1.2945629259917546e-07, "epoch": 19.0, "percentage": 96.76, "elapsed_time": "5:01:50", "remaining_time": "0:10:06", "throughput": 2370.07, "total_tokens": 42922672} {"current_steps": 1046, "total_steps": 1080, "loss": 0.0292, "lr": 1.22170413724923e-07, "epoch": 19.01834862385321, "percentage": 96.85, "elapsed_time": "5:02:09", "remaining_time": "0:09:49", "throughput": 2369.83, "total_tokens": 42964176} {"current_steps": 1047, "total_steps": 1080, "loss": 0.0183, "lr": 1.1509504082052869e-07, "epoch": 19.03669724770642, "percentage": 96.94, "elapsed_time": "5:02:29", "remaining_time": "0:09:32", "throughput": 2369.87, "total_tokens": 43012560} {"current_steps": 1048, "total_steps": 1080, "loss": 0.0219, "lr": 1.0823023375489127e-07, "epoch": 19.05504587155963, "percentage": 97.04, "elapsed_time": "5:02:45", "remaining_time": "0:09:14", "throughput": 2369.73, "total_tokens": 43047752} {"current_steps": 1049, "total_steps": 1080, "loss": 0.0239, "lr": 1.0157605061517916e-07, "epoch": 19.073394495412845, "percentage": 97.13, "elapsed_time": "5:03:01", "remaining_time": "0:08:57", "throughput": 2369.76, "total_tokens": 43085720} {"current_steps": 1050, "total_steps": 1080, "loss": 0.0131, "lr": 9.513254770636137e-08, "epoch": 19.091743119266056, "percentage": 97.22, "elapsed_time": "5:03:20", "remaining_time": "0:08:40", "throughput": 2369.9, "total_tokens": 43133928} {"current_steps": 1051, "total_steps": 1080, "loss": 0.0195, "lr": 8.889977955071071e-08, "epoch": 19.110091743119266, "percentage": 97.31, "elapsed_time": "5:03:36", "remaining_time": "0:08:22", "throughput": 2370.02, "total_tokens": 43174440} {"current_steps": 1052, "total_steps": 1080, "loss": 0.0175, "lr": 8.28777988873486e-08, "epoch": 19.128440366972477, "percentage": 97.41, "elapsed_time": "5:03:54", "remaining_time": "0:08:05", "throughput": 2369.91, "total_tokens": 43214128} {"current_steps": 1053, "total_steps": 1080, "loss": 0.0194, "lr": 7.706665667180091e-08, "epoch": 19.146788990825687, "percentage": 97.5, "elapsed_time": "5:04:12", "remaining_time": "0:07:48", "throughput": 2369.81, "total_tokens": 43254824} {"current_steps": 1054, "total_steps": 1080, "loss": 0.0207, "lr": 7.14664020755651e-08, "epoch": 19.165137614678898, "percentage": 97.59, "elapsed_time": "5:04:26", "remaining_time": "0:07:30", "throughput": 2369.9, "total_tokens": 43290632} {"current_steps": 1055, "total_steps": 1080, "loss": 0.0195, "lr": 6.607708248569377e-08, "epoch": 19.18348623853211, "percentage": 97.69, "elapsed_time": "5:04:46", "remaining_time": "0:07:13", "throughput": 2370.04, "total_tokens": 43338720} {"current_steps": 1056, "total_steps": 1080, "loss": 0.0201, "lr": 6.089874350439506e-08, "epoch": 19.201834862385322, "percentage": 97.78, "elapsed_time": "5:05:03", "remaining_time": "0:06:55", "throughput": 2369.99, "total_tokens": 43378544} {"current_steps": 1057, "total_steps": 1080, "loss": 0.0179, "lr": 5.593142894864123e-08, "epoch": 19.220183486238533, "percentage": 97.87, "elapsed_time": "5:05:20", "remaining_time": "0:06:38", "throughput": 2369.95, "total_tokens": 43418136} {"current_steps": 1058, "total_steps": 1080, "loss": 0.0176, "lr": 5.117518084981621e-08, "epoch": 19.238532110091743, "percentage": 97.96, "elapsed_time": "5:05:34", "remaining_time": "0:06:21", "throughput": 2370.11, "total_tokens": 43455504} {"current_steps": 1059, "total_steps": 1080, "loss": 0.0232, "lr": 4.6630039453327e-08, "epoch": 19.256880733944953, "percentage": 98.06, "elapsed_time": "5:05:46", "remaining_time": "0:06:03", "throughput": 2370.16, "total_tokens": 43483904} {"current_steps": 1060, "total_steps": 1080, "loss": 0.0193, "lr": 4.229604321829561e-08, "epoch": 19.275229357798164, "percentage": 98.15, "elapsed_time": "5:06:04", "remaining_time": "0:05:46", "throughput": 2370.06, "total_tokens": 43525440} {"current_steps": 1061, "total_steps": 1080, "loss": 0.0171, "lr": 3.817322881721763e-08, "epoch": 19.293577981651374, "percentage": 98.24, "elapsed_time": "5:06:23", "remaining_time": "0:05:29", "throughput": 2369.99, "total_tokens": 43567648} {"current_steps": 1062, "total_steps": 1080, "loss": 0.0157, "lr": 3.426163113565417e-08, "epoch": 19.31192660550459, "percentage": 98.33, "elapsed_time": "5:06:43", "remaining_time": "0:05:11", "throughput": 2370.0, "total_tokens": 43616600} {"current_steps": 1063, "total_steps": 1080, "loss": 0.0215, "lr": 3.056128327193486e-08, "epoch": 19.3302752293578, "percentage": 98.43, "elapsed_time": "5:06:58", "remaining_time": "0:04:54", "throughput": 2369.82, "total_tokens": 43649488} {"current_steps": 1064, "total_steps": 1080, "loss": 0.0232, "lr": 2.7072216536885853e-08, "epoch": 19.34862385321101, "percentage": 98.52, "elapsed_time": "5:07:20", "remaining_time": "0:04:37", "throughput": 2369.56, "total_tokens": 43695504} {"current_steps": 1065, "total_steps": 1080, "loss": 0.0231, "lr": 2.3794460453555047e-08, "epoch": 19.36697247706422, "percentage": 98.61, "elapsed_time": "5:07:37", "remaining_time": "0:04:19", "throughput": 2369.4, "total_tokens": 43733384} {"current_steps": 1066, "total_steps": 1080, "loss": 0.0206, "lr": 2.0728042756967824e-08, "epoch": 19.38532110091743, "percentage": 98.7, "elapsed_time": "5:07:53", "remaining_time": "0:04:02", "throughput": 2369.71, "total_tokens": 43777400} {"current_steps": 1067, "total_steps": 1080, "loss": 0.0246, "lr": 1.7872989393888373e-08, "epoch": 19.40366972477064, "percentage": 98.8, "elapsed_time": "5:08:15", "remaining_time": "0:03:45", "throughput": 2369.56, "total_tokens": 43826152} {"current_steps": 1068, "total_steps": 1080, "loss": 0.0162, "lr": 1.522932452260595e-08, "epoch": 19.422018348623855, "percentage": 98.89, "elapsed_time": "5:08:35", "remaining_time": "0:03:28", "throughput": 2369.64, "total_tokens": 43875264} {"current_steps": 1069, "total_steps": 1080, "loss": 0.0149, "lr": 1.2797070512726716e-08, "epoch": 19.440366972477065, "percentage": 98.98, "elapsed_time": "5:08:53", "remaining_time": "0:03:10", "throughput": 2369.64, "total_tokens": 43917752} {"current_steps": 1070, "total_steps": 1080, "loss": 0.0209, "lr": 1.0576247944985018e-08, "epoch": 19.458715596330276, "percentage": 99.07, "elapsed_time": "5:09:13", "remaining_time": "0:02:53", "throughput": 2369.79, "total_tokens": 43968216} {"current_steps": 1071, "total_steps": 1080, "loss": 0.0205, "lr": 8.566875611068504e-09, "epoch": 19.477064220183486, "percentage": 99.17, "elapsed_time": "5:09:26", "remaining_time": "0:02:36", "throughput": 2369.7, "total_tokens": 43997248} {"current_steps": 1072, "total_steps": 1080, "loss": 0.0128, "lr": 6.768970513457151e-09, "epoch": 19.495412844036696, "percentage": 99.26, "elapsed_time": "5:09:41", "remaining_time": "0:02:18", "throughput": 2369.92, "total_tokens": 44036296} {"current_steps": 1073, "total_steps": 1080, "loss": 0.0267, "lr": 5.182547865290044e-09, "epoch": 19.513761467889907, "percentage": 99.35, "elapsed_time": "5:10:00", "remaining_time": "0:02:01", "throughput": 2370.15, "total_tokens": 44084872} {"current_steps": 1074, "total_steps": 1080, "loss": 0.0196, "lr": 3.807621090218261e-09, "epoch": 19.53211009174312, "percentage": 99.44, "elapsed_time": "5:10:18", "remaining_time": "0:01:44", "throughput": 2370.22, "total_tokens": 44129072} {"current_steps": 1075, "total_steps": 1080, "loss": 0.0208, "lr": 2.6442018223132857e-09, "epoch": 19.55045871559633, "percentage": 99.54, "elapsed_time": "5:10:35", "remaining_time": "0:01:26", "throughput": 2370.05, "total_tokens": 44167088} {"current_steps": 1076, "total_steps": 1080, "loss": 0.0177, "lr": 1.692299905944883e-09, "epoch": 19.568807339449542, "percentage": 99.63, "elapsed_time": "5:10:51", "remaining_time": "0:01:09", "throughput": 2370.01, "total_tokens": 44204544} {"current_steps": 1077, "total_steps": 1080, "loss": 0.0178, "lr": 9.51923395717258e-10, "epoch": 19.587155963302752, "percentage": 99.72, "elapsed_time": "5:11:06", "remaining_time": "0:00:51", "throughput": 2370.23, "total_tokens": 44243296} {"current_steps": 1078, "total_steps": 1080, "loss": 0.0254, "lr": 4.2307855639411865e-10, "epoch": 19.605504587155963, "percentage": 99.81, "elapsed_time": "5:11:25", "remaining_time": "0:00:34", "throughput": 2370.24, "total_tokens": 44289840} {"current_steps": 1079, "total_steps": 1080, "loss": 0.0215, "lr": 1.0576986284316359e-10, "epoch": 19.623853211009173, "percentage": 99.91, "elapsed_time": "5:11:43", "remaining_time": "0:00:17", "throughput": 2370.33, "total_tokens": 44334688} {"current_steps": 1080, "total_steps": 1080, "loss": 0.0131, "lr": 0.0, "epoch": 19.642201834862384, "percentage": 100.0, "elapsed_time": "5:12:04", "remaining_time": "0:00:00", "throughput": 2370.4, "total_tokens": 44384416} {"current_steps": 1080, "total_steps": 1080, "epoch": 19.642201834862384, "percentage": 100.0, "elapsed_time": "5:12:06", "remaining_time": "0:00:00", "throughput": 2370.17, "total_tokens": 44384416}