|
{"current_steps": 5, "total_steps": 310, "loss": 0.4839, "lr": 9.993582535855265e-06, "epoch": 0.08, "percentage": 1.61, "elapsed_time": "0:06:59", "remaining_time": "7:06:33", "throughput": 1798.3, "total_tokens": 754512} |
|
{"current_steps": 10, "total_steps": 310, "loss": 0.4234, "lr": 9.974346616959476e-06, "epoch": 0.16, "percentage": 3.23, "elapsed_time": "0:12:48", "remaining_time": "6:24:08", "throughput": 1878.91, "total_tokens": 1443544} |
|
{"current_steps": 15, "total_steps": 310, "loss": 0.4307, "lr": 9.942341621640558e-06, "epoch": 0.24, "percentage": 4.84, "elapsed_time": "0:19:13", "remaining_time": "6:17:59", "throughput": 1940.53, "total_tokens": 2237816} |
|
{"current_steps": 20, "total_steps": 310, "loss": 0.4162, "lr": 9.897649706262474e-06, "epoch": 0.32, "percentage": 6.45, "elapsed_time": "0:25:30", "remaining_time": "6:09:50", "throughput": 1974.82, "total_tokens": 3022240} |
|
{"current_steps": 25, "total_steps": 310, "loss": 0.4292, "lr": 9.840385594331022e-06, "epoch": 0.4, "percentage": 8.06, "elapsed_time": "0:32:07", "remaining_time": "6:06:13", "throughput": 1996.5, "total_tokens": 3848256} |
|
{"current_steps": 30, "total_steps": 310, "loss": 0.422, "lr": 9.770696282000245e-06, "epoch": 0.48, "percentage": 9.68, "elapsed_time": "0:38:20", "remaining_time": "5:57:47", "throughput": 2012.49, "total_tokens": 4628944} |
|
{"current_steps": 35, "total_steps": 310, "loss": 0.4019, "lr": 9.688760660735403e-06, "epoch": 0.56, "percentage": 11.29, "elapsed_time": "0:45:16", "remaining_time": "5:55:47", "throughput": 1985.67, "total_tokens": 5395008} |
|
{"current_steps": 40, "total_steps": 310, "loss": 0.3864, "lr": 9.594789058101154e-06, "epoch": 0.64, "percentage": 12.9, "elapsed_time": "0:51:23", "remaining_time": "5:46:50", "throughput": 1992.15, "total_tokens": 6141864} |
|
{"current_steps": 45, "total_steps": 310, "loss": 0.3896, "lr": 9.48902269785371e-06, "epoch": 0.72, "percentage": 14.52, "elapsed_time": "0:57:57", "remaining_time": "5:41:17", "throughput": 1989.42, "total_tokens": 6917880} |
|
{"current_steps": 50, "total_steps": 310, "loss": 0.4077, "lr": 9.371733080722911e-06, "epoch": 0.8, "percentage": 16.13, "elapsed_time": "1:04:28", "remaining_time": "5:35:13", "throughput": 2004.88, "total_tokens": 7755008} |
|
{"current_steps": 55, "total_steps": 310, "loss": 0.3847, "lr": 9.243221287473755e-06, "epoch": 0.88, "percentage": 17.74, "elapsed_time": "1:10:15", "remaining_time": "5:25:46", "throughput": 2024.47, "total_tokens": 8534776} |
|
{"current_steps": 60, "total_steps": 310, "loss": 0.4094, "lr": 9.103817206036383e-06, "epoch": 0.96, "percentage": 19.35, "elapsed_time": "1:16:58", "remaining_time": "5:20:42", "throughput": 2014.46, "total_tokens": 9303408} |
|
{"current_steps": 65, "total_steps": 310, "loss": 0.3788, "lr": 8.953878684688492e-06, "epoch": 1.032, "percentage": 20.97, "elapsed_time": "1:22:28", "remaining_time": "5:10:51", "throughput": 2019.75, "total_tokens": 9994688} |
|
{"current_steps": 70, "total_steps": 310, "loss": 0.3143, "lr": 8.793790613463956e-06, "epoch": 1.112, "percentage": 22.58, "elapsed_time": "1:28:39", "remaining_time": "5:03:59", "throughput": 2015.78, "total_tokens": 10723800} |
|
{"current_steps": 75, "total_steps": 310, "loss": 0.3143, "lr": 8.6239639361456e-06, "epoch": 1.192, "percentage": 24.19, "elapsed_time": "1:35:03", "remaining_time": "4:57:50", "throughput": 2012.55, "total_tokens": 11478016} |
|
{"current_steps": 80, "total_steps": 310, "loss": 0.3205, "lr": 8.444834595378434e-06, "epoch": 1.272, "percentage": 25.81, "elapsed_time": "1:41:26", "remaining_time": "4:51:37", "throughput": 2017.21, "total_tokens": 12276744} |
|
{"current_steps": 85, "total_steps": 310, "loss": 0.2927, "lr": 8.256862413611113e-06, "epoch": 1.3519999999999999, "percentage": 27.42, "elapsed_time": "1:47:46", "remaining_time": "4:45:18", "throughput": 2011.36, "total_tokens": 13007328} |
|
{"current_steps": 90, "total_steps": 310, "loss": 0.3098, "lr": 8.060529912738316e-06, "epoch": 1.432, "percentage": 29.03, "elapsed_time": "1:54:35", "remaining_time": "4:40:05", "throughput": 2019.38, "total_tokens": 13883416} |
|
{"current_steps": 95, "total_steps": 310, "loss": 0.3254, "lr": 7.856341075473963e-06, "epoch": 1.512, "percentage": 30.65, "elapsed_time": "2:01:17", "remaining_time": "4:34:29", "throughput": 2023.56, "total_tokens": 14726032} |
|
{"current_steps": 100, "total_steps": 310, "loss": 0.3029, "lr": 7.644820051634813e-06, "epoch": 1.592, "percentage": 32.26, "elapsed_time": "2:07:38", "remaining_time": "4:28:03", "throughput": 2023.69, "total_tokens": 15499232} |
|
{"current_steps": 105, "total_steps": 310, "loss": 0.3065, "lr": 7.4265098126554065e-06, "epoch": 1.6720000000000002, "percentage": 33.87, "elapsed_time": "2:17:16", "remaining_time": "4:28:00", "throughput": 1975.45, "total_tokens": 16270704} |
|
{"current_steps": 110, "total_steps": 310, "loss": 0.3073, "lr": 7.201970757788172e-06, "epoch": 1.752, "percentage": 35.48, "elapsed_time": "2:23:54", "remaining_time": "4:21:39", "throughput": 1976.98, "total_tokens": 17070776} |
|
{"current_steps": 115, "total_steps": 310, "loss": 0.3311, "lr": 6.971779275566593e-06, "epoch": 1.8319999999999999, "percentage": 37.1, "elapsed_time": "2:30:39", "remaining_time": "4:15:27", "throughput": 1976.62, "total_tokens": 17867208} |
|
{"current_steps": 120, "total_steps": 310, "loss": 0.3137, "lr": 6.736526264224101e-06, "epoch": 1.912, "percentage": 38.71, "elapsed_time": "2:36:55", "remaining_time": "4:08:28", "throughput": 1974.88, "total_tokens": 18595440} |
|
{"current_steps": 125, "total_steps": 310, "loss": 0.3024, "lr": 6.496815614866792e-06, "epoch": 1.992, "percentage": 40.32, "elapsed_time": "2:43:45", "remaining_time": "4:02:21", "throughput": 1968.51, "total_tokens": 19341712} |
|
{"current_steps": 130, "total_steps": 310, "loss": 0.2485, "lr": 6.2532626612936035e-06, "epoch": 2.064, "percentage": 41.94, "elapsed_time": "2:49:12", "remaining_time": "3:54:16", "throughput": 1971.18, "total_tokens": 20011712} |
|
{"current_steps": 135, "total_steps": 310, "loss": 0.2332, "lr": 6.006492600443301e-06, "epoch": 2.144, "percentage": 43.55, "elapsed_time": "2:55:53", "remaining_time": "3:48:00", "throughput": 1966.41, "total_tokens": 20752688} |
|
{"current_steps": 140, "total_steps": 310, "loss": 0.2394, "lr": 5.757138887522884e-06, "epoch": 2.224, "percentage": 45.16, "elapsed_time": "3:02:38", "remaining_time": "3:41:46", "throughput": 1964.28, "total_tokens": 21525792} |
|
{"current_steps": 145, "total_steps": 310, "loss": 0.2253, "lr": 5.505841609937162e-06, "epoch": 2.304, "percentage": 46.77, "elapsed_time": "3:09:20", "remaining_time": "3:35:27", "throughput": 1962.93, "total_tokens": 22300064} |
|
{"current_steps": 150, "total_steps": 310, "loss": 0.2463, "lr": 5.253245844193564e-06, "epoch": 2.384, "percentage": 48.39, "elapsed_time": "3:15:46", "remaining_time": "3:28:49", "throughput": 1966.11, "total_tokens": 23094008} |
|
{"current_steps": 155, "total_steps": 310, "loss": 0.2488, "lr": 5e-06, "epoch": 2.464, "percentage": 50.0, "elapsed_time": "3:22:36", "remaining_time": "3:22:36", "throughput": 1966.69, "total_tokens": 23908816} |
|
{"current_steps": 160, "total_steps": 310, "loss": 0.253, "lr": 4.746754155806437e-06, "epoch": 2.544, "percentage": 51.61, "elapsed_time": "3:28:57", "remaining_time": "3:15:53", "throughput": 1967.78, "total_tokens": 24670168} |
|
{"current_steps": 165, "total_steps": 310, "loss": 0.2318, "lr": 4.49415839006284e-06, "epoch": 2.624, "percentage": 53.23, "elapsed_time": "3:36:12", "remaining_time": "3:10:00", "throughput": 1963.46, "total_tokens": 25471232} |
|
{"current_steps": 170, "total_steps": 310, "loss": 0.2379, "lr": 4.2428611124771184e-06, "epoch": 2.7039999999999997, "percentage": 54.84, "elapsed_time": "3:42:23", "remaining_time": "3:03:09", "throughput": 1966.11, "total_tokens": 26235512} |
|
{"current_steps": 175, "total_steps": 310, "loss": 0.2496, "lr": 3.993507399556699e-06, "epoch": 2.784, "percentage": 56.45, "elapsed_time": "3:48:59", "remaining_time": "2:56:39", "throughput": 1967.06, "total_tokens": 27027008} |
|
{"current_steps": 180, "total_steps": 310, "loss": 0.2189, "lr": 3.7467373387063973e-06, "epoch": 2.864, "percentage": 58.06, "elapsed_time": "3:55:23", "remaining_time": "2:50:00", "throughput": 1964.29, "total_tokens": 27743104} |
|
{"current_steps": 185, "total_steps": 310, "loss": 0.2428, "lr": 3.5031843851332105e-06, "epoch": 2.944, "percentage": 59.68, "elapsed_time": "4:02:02", "remaining_time": "2:43:32", "throughput": 1965.73, "total_tokens": 28547112} |
|
{"current_steps": 190, "total_steps": 310, "loss": 0.2296, "lr": 3.2634737357758994e-06, "epoch": 3.016, "percentage": 61.29, "elapsed_time": "4:07:51", "remaining_time": "2:36:32", "throughput": 1968.18, "total_tokens": 29270520} |
|
{"current_steps": 195, "total_steps": 310, "loss": 0.1756, "lr": 3.0282207244334084e-06, "epoch": 3.096, "percentage": 62.9, "elapsed_time": "4:14:40", "remaining_time": "2:30:11", "throughput": 1965.61, "total_tokens": 30034816} |
|
{"current_steps": 200, "total_steps": 310, "loss": 0.1764, "lr": 2.7980292422118282e-06, "epoch": 3.176, "percentage": 64.52, "elapsed_time": "4:21:16", "remaining_time": "2:23:42", "throughput": 1967.14, "total_tokens": 30838296} |
|
{"current_steps": 205, "total_steps": 310, "loss": 0.1952, "lr": 2.573490187344596e-06, "epoch": 3.2560000000000002, "percentage": 66.13, "elapsed_time": "4:29:59", "remaining_time": "2:18:17", "throughput": 1950.19, "total_tokens": 31592264} |
|
{"current_steps": 210, "total_steps": 310, "loss": 0.1839, "lr": 2.3551799483651894e-06, "epoch": 3.336, "percentage": 67.74, "elapsed_time": "4:36:57", "remaining_time": "2:11:53", "throughput": 1946.58, "total_tokens": 32347456} |
|
{"current_steps": 215, "total_steps": 310, "loss": 0.1875, "lr": 2.1436589245260375e-06, "epoch": 3.416, "percentage": 69.35, "elapsed_time": "4:43:37", "remaining_time": "2:05:19", "throughput": 1947.22, "total_tokens": 33136312} |
|
{"current_steps": 220, "total_steps": 310, "loss": 0.1813, "lr": 1.9394700872616856e-06, "epoch": 3.496, "percentage": 70.97, "elapsed_time": "4:50:01", "remaining_time": "1:58:38", "throughput": 1945.81, "total_tokens": 33859016} |
|
{"current_steps": 225, "total_steps": 310, "loss": 0.1752, "lr": 1.74313758638889e-06, "epoch": 3.576, "percentage": 72.58, "elapsed_time": "4:56:16", "remaining_time": "1:51:55", "throughput": 1950.68, "total_tokens": 34676448} |
|
{"current_steps": 230, "total_steps": 310, "loss": 0.1736, "lr": 1.555165404621567e-06, "epoch": 3.656, "percentage": 74.19, "elapsed_time": "5:02:38", "remaining_time": "1:45:16", "throughput": 1948.14, "total_tokens": 35375424} |
|
{"current_steps": 235, "total_steps": 310, "loss": 0.1902, "lr": 1.3760360638544012e-06, "epoch": 3.7359999999999998, "percentage": 75.81, "elapsed_time": "5:09:17", "remaining_time": "1:38:42", "throughput": 1947.24, "total_tokens": 36136312} |
|
{"current_steps": 240, "total_steps": 310, "loss": 0.1871, "lr": 1.2062093865360458e-06, "epoch": 3.816, "percentage": 77.42, "elapsed_time": "5:15:38", "remaining_time": "1:32:03", "throughput": 1950.44, "total_tokens": 36939320} |
|
{"current_steps": 245, "total_steps": 310, "loss": 0.183, "lr": 1.046121315311508e-06, "epoch": 3.896, "percentage": 79.03, "elapsed_time": "5:21:52", "remaining_time": "1:25:23", "throughput": 1953.63, "total_tokens": 37729192} |
|
{"current_steps": 250, "total_steps": 310, "loss": 0.1809, "lr": 8.961827939636198e-07, "epoch": 3.976, "percentage": 80.65, "elapsed_time": "5:28:46", "remaining_time": "1:18:54", "throughput": 1954.94, "total_tokens": 38564792} |
|
{"current_steps": 255, "total_steps": 310, "loss": 0.1592, "lr": 7.567787125262449e-07, "epoch": 4.048, "percentage": 82.26, "elapsed_time": "5:35:02", "remaining_time": "1:12:15", "throughput": 1953.51, "total_tokens": 39270152} |
|
{"current_steps": 260, "total_steps": 310, "loss": 0.1504, "lr": 6.282669192770896e-07, "epoch": 4.128, "percentage": 83.87, "elapsed_time": "5:41:20", "remaining_time": "1:05:38", "throughput": 1952.51, "total_tokens": 39988296} |
|
{"current_steps": 265, "total_steps": 310, "loss": 0.1556, "lr": 5.109773021462921e-07, "epoch": 4.208, "percentage": 85.48, "elapsed_time": "5:47:31", "remaining_time": "0:59:00", "throughput": 1955.13, "total_tokens": 40767664} |
|
{"current_steps": 270, "total_steps": 310, "loss": 0.1529, "lr": 4.05210941898847e-07, "epoch": 4.288, "percentage": 87.1, "elapsed_time": "5:54:43", "remaining_time": "0:52:33", "throughput": 1954.35, "total_tokens": 41595680} |
|
{"current_steps": 275, "total_steps": 310, "loss": 0.1565, "lr": 3.112393392645985e-07, "epoch": 4.368, "percentage": 88.71, "elapsed_time": "6:01:16", "remaining_time": "0:45:58", "throughput": 1953.12, "total_tokens": 42336752} |
|
{"current_steps": 280, "total_steps": 310, "loss": 0.159, "lr": 2.2930371799975593e-07, "epoch": 4.448, "percentage": 90.32, "elapsed_time": "6:07:27", "remaining_time": "0:39:22", "throughput": 1957.36, "total_tokens": 43154640} |
|
{"current_steps": 285, "total_steps": 310, "loss": 0.1589, "lr": 1.5961440566897913e-07, "epoch": 4.5280000000000005, "percentage": 91.94, "elapsed_time": "6:14:33", "remaining_time": "0:32:51", "throughput": 1959.33, "total_tokens": 44032488} |
|
{"current_steps": 290, "total_steps": 310, "loss": 0.1459, "lr": 1.0235029373752758e-07, "epoch": 4.608, "percentage": 93.55, "elapsed_time": "6:20:46", "remaining_time": "0:26:15", "throughput": 1960.91, "total_tokens": 44799728} |
|
{"current_steps": 295, "total_steps": 310, "loss": 0.1595, "lr": 5.7658378359443104e-08, "epoch": 4.688, "percentage": 95.16, "elapsed_time": "6:27:14", "remaining_time": "0:19:41", "throughput": 1962.17, "total_tokens": 45590936} |
|
{"current_steps": 300, "total_steps": 310, "loss": 0.1772, "lr": 2.5653383040524228e-08, "epoch": 4.768, "percentage": 96.77, "elapsed_time": "6:33:14", "remaining_time": "0:13:06", "throughput": 1963.2, "total_tokens": 46319968} |
|
{"current_steps": 305, "total_steps": 310, "loss": 0.1556, "lr": 6.417464144736208e-09, "epoch": 4.848, "percentage": 98.39, "elapsed_time": "6:42:22", "remaining_time": "0:06:35", "throughput": 1950.0, "total_tokens": 47077304} |
|
{"current_steps": 310, "total_steps": 310, "loss": 0.145, "lr": 0.0, "epoch": 4.928, "percentage": 100.0, "elapsed_time": "6:48:46", "remaining_time": "0:00:00", "throughput": 1949.9, "total_tokens": 47823272} |
|
{"current_steps": 310, "total_steps": 310, "epoch": 4.928, "percentage": 100.0, "elapsed_time": "6:51:08", "remaining_time": "0:00:00", "throughput": 1938.66, "total_tokens": 47823272} |
|
|