|
{"current_steps": 1, "total_steps": 258, "loss": 2.6815, "lr": 0.0, "epoch": 0.011627906976744186, "percentage": 0.39, "elapsed_time": "0:00:20", "remaining_time": "1:26:31"} |
|
{"current_steps": 2, "total_steps": 258, "loss": 2.8172, "lr": 7.692307692307694e-06, "epoch": 0.023255813953488372, "percentage": 0.78, "elapsed_time": "0:00:36", "remaining_time": "1:17:18"} |
|
{"current_steps": 3, "total_steps": 258, "loss": 2.7979, "lr": 1.5384615384615387e-05, "epoch": 0.03488372093023256, "percentage": 1.16, "elapsed_time": "0:00:52", "remaining_time": "1:14:14"} |
|
{"current_steps": 4, "total_steps": 258, "loss": 2.7698, "lr": 2.307692307692308e-05, "epoch": 0.046511627906976744, "percentage": 1.55, "elapsed_time": "0:01:08", "remaining_time": "1:12:08"} |
|
{"current_steps": 5, "total_steps": 258, "loss": 2.6846, "lr": 3.0769230769230774e-05, "epoch": 0.05813953488372093, "percentage": 1.94, "elapsed_time": "0:01:24", "remaining_time": "1:10:52"} |
|
{"current_steps": 6, "total_steps": 258, "loss": 2.4865, "lr": 3.846153846153846e-05, "epoch": 0.06976744186046512, "percentage": 2.33, "elapsed_time": "0:01:40", "remaining_time": "1:10:11"} |
|
{"current_steps": 7, "total_steps": 258, "loss": 2.3993, "lr": 4.615384615384616e-05, "epoch": 0.08139534883720931, "percentage": 2.71, "elapsed_time": "0:01:56", "remaining_time": "1:09:36"} |
|
{"current_steps": 8, "total_steps": 258, "loss": 2.0547, "lr": 5.384615384615385e-05, "epoch": 0.09302325581395349, "percentage": 3.1, "elapsed_time": "0:02:11", "remaining_time": "1:08:38"} |
|
{"current_steps": 9, "total_steps": 258, "loss": 1.7189, "lr": 6.153846153846155e-05, "epoch": 0.10465116279069768, "percentage": 3.49, "elapsed_time": "0:02:27", "remaining_time": "1:08:03"} |
|
{"current_steps": 10, "total_steps": 258, "loss": 1.4047, "lr": 6.923076923076924e-05, "epoch": 0.11627906976744186, "percentage": 3.88, "elapsed_time": "0:02:44", "remaining_time": "1:07:52"} |
|
{"current_steps": 10, "total_steps": 258, "eval_loss": 1.1081944704055786, "epoch": 0.11627906976744186, "percentage": 3.88, "elapsed_time": "0:03:53", "remaining_time": "1:36:26"} |
|
{"current_steps": 11, "total_steps": 258, "loss": 1.0561, "lr": 7.692307692307693e-05, "epoch": 0.12790697674418605, "percentage": 4.26, "elapsed_time": "0:04:09", "remaining_time": "1:33:25"} |
|
{"current_steps": 12, "total_steps": 258, "loss": 0.7269, "lr": 8.461538461538461e-05, "epoch": 0.13953488372093023, "percentage": 4.65, "elapsed_time": "0:04:25", "remaining_time": "1:30:44"} |
|
{"current_steps": 13, "total_steps": 258, "loss": 0.4613, "lr": 9.230769230769232e-05, "epoch": 0.1511627906976744, "percentage": 5.04, "elapsed_time": "0:04:41", "remaining_time": "1:28:27"} |
|
{"current_steps": 14, "total_steps": 258, "loss": 0.2739, "lr": 0.0001, "epoch": 0.16279069767441862, "percentage": 5.43, "elapsed_time": "0:04:59", "remaining_time": "1:27:01"} |
|
{"current_steps": 15, "total_steps": 258, "loss": 0.1802, "lr": 0.0001076923076923077, "epoch": 0.1744186046511628, "percentage": 5.81, "elapsed_time": "0:05:15", "remaining_time": "1:25:09"} |
|
{"current_steps": 16, "total_steps": 258, "loss": 0.1093, "lr": 0.00011538461538461538, "epoch": 0.18604651162790697, "percentage": 6.2, "elapsed_time": "0:05:31", "remaining_time": "1:23:30"} |
|
{"current_steps": 17, "total_steps": 258, "loss": 0.0676, "lr": 0.0001230769230769231, "epoch": 0.19767441860465115, "percentage": 6.59, "elapsed_time": "0:05:47", "remaining_time": "1:22:04"} |
|
{"current_steps": 18, "total_steps": 258, "loss": 0.045, "lr": 0.00013076923076923077, "epoch": 0.20930232558139536, "percentage": 6.98, "elapsed_time": "0:06:02", "remaining_time": "1:20:38"} |
|
{"current_steps": 19, "total_steps": 258, "loss": 0.0505, "lr": 0.00013846153846153847, "epoch": 0.22093023255813954, "percentage": 7.36, "elapsed_time": "0:06:18", "remaining_time": "1:19:21"} |
|
{"current_steps": 20, "total_steps": 258, "loss": 0.0377, "lr": 0.00014615384615384615, "epoch": 0.23255813953488372, "percentage": 7.75, "elapsed_time": "0:06:35", "remaining_time": "1:18:23"} |
|
{"current_steps": 20, "total_steps": 258, "eval_loss": 0.04212512448430061, "epoch": 0.23255813953488372, "percentage": 7.75, "elapsed_time": "0:07:44", "remaining_time": "1:32:01"} |
|
{"current_steps": 21, "total_steps": 258, "loss": 0.0409, "lr": 0.00015384615384615385, "epoch": 0.2441860465116279, "percentage": 8.14, "elapsed_time": "0:08:00", "remaining_time": "1:30:22"} |
|
{"current_steps": 22, "total_steps": 258, "loss": 0.0322, "lr": 0.00016153846153846155, "epoch": 0.2558139534883721, "percentage": 8.53, "elapsed_time": "0:08:16", "remaining_time": "1:28:45"} |
|
{"current_steps": 23, "total_steps": 258, "loss": 0.0389, "lr": 0.00016923076923076923, "epoch": 0.26744186046511625, "percentage": 8.91, "elapsed_time": "0:08:32", "remaining_time": "1:27:17"} |
|
{"current_steps": 24, "total_steps": 258, "loss": 0.0355, "lr": 0.00017692307692307693, "epoch": 0.27906976744186046, "percentage": 9.3, "elapsed_time": "0:08:48", "remaining_time": "1:25:53"} |
|
{"current_steps": 25, "total_steps": 258, "loss": 0.0392, "lr": 0.00018461538461538463, "epoch": 0.29069767441860467, "percentage": 9.69, "elapsed_time": "0:09:04", "remaining_time": "1:24:31"} |
|
{"current_steps": 26, "total_steps": 258, "loss": 0.0311, "lr": 0.00019230769230769233, "epoch": 0.3023255813953488, "percentage": 10.08, "elapsed_time": "0:09:20", "remaining_time": "1:23:24"} |
|
{"current_steps": 27, "total_steps": 258, "loss": 0.0311, "lr": 0.0002, "epoch": 0.313953488372093, "percentage": 10.47, "elapsed_time": "0:09:37", "remaining_time": "1:22:18"} |
|
{"current_steps": 28, "total_steps": 258, "loss": 0.0304, "lr": 0.00019999083173529673, "epoch": 0.32558139534883723, "percentage": 10.85, "elapsed_time": "0:09:54", "remaining_time": "1:21:19"} |
|
{"current_steps": 29, "total_steps": 258, "loss": 0.0295, "lr": 0.0001999633286223284, "epoch": 0.3372093023255814, "percentage": 11.24, "elapsed_time": "0:10:09", "remaining_time": "1:20:16"} |
|
{"current_steps": 30, "total_steps": 258, "loss": 0.0309, "lr": 0.00019991749570421146, "epoch": 0.3488372093023256, "percentage": 11.63, "elapsed_time": "0:10:26", "remaining_time": "1:19:20"} |
|
{"current_steps": 30, "total_steps": 258, "eval_loss": 0.03273880109190941, "epoch": 0.3488372093023256, "percentage": 11.63, "elapsed_time": "0:11:35", "remaining_time": "1:28:07"} |
|
{"current_steps": 31, "total_steps": 258, "loss": 0.0298, "lr": 0.00019985334138511237, "epoch": 0.36046511627906974, "percentage": 12.02, "elapsed_time": "0:11:51", "remaining_time": "1:26:50"} |
|
{"current_steps": 32, "total_steps": 258, "loss": 0.0346, "lr": 0.0001997708774287068, "epoch": 0.37209302325581395, "percentage": 12.4, "elapsed_time": "0:12:06", "remaining_time": "1:25:33"} |
|
{"current_steps": 33, "total_steps": 258, "loss": 0.0301, "lr": 0.0001996701189560223, "epoch": 0.38372093023255816, "percentage": 12.79, "elapsed_time": "0:12:23", "remaining_time": "1:24:27"} |
|
{"current_steps": 34, "total_steps": 258, "loss": 0.0291, "lr": 0.00019955108444266585, "epoch": 0.3953488372093023, "percentage": 13.18, "elapsed_time": "0:12:38", "remaining_time": "1:23:19"} |
|
{"current_steps": 35, "total_steps": 258, "loss": 0.0302, "lr": 0.00019941379571543596, "epoch": 0.4069767441860465, "percentage": 13.57, "elapsed_time": "0:12:54", "remaining_time": "1:22:14"} |
|
{"current_steps": 36, "total_steps": 258, "loss": 0.0281, "lr": 0.00019925827794832056, "epoch": 0.4186046511627907, "percentage": 13.95, "elapsed_time": "0:13:10", "remaining_time": "1:21:16"} |
|
{"current_steps": 37, "total_steps": 258, "loss": 0.0321, "lr": 0.00019908455965788067, "epoch": 0.43023255813953487, "percentage": 14.34, "elapsed_time": "0:13:26", "remaining_time": "1:20:18"} |
|
{"current_steps": 38, "total_steps": 258, "loss": 0.0285, "lr": 0.00019889267269802176, "epoch": 0.4418604651162791, "percentage": 14.73, "elapsed_time": "0:13:42", "remaining_time": "1:19:23"} |
|
{"current_steps": 39, "total_steps": 258, "loss": 0.0283, "lr": 0.00019868265225415265, "epoch": 0.45348837209302323, "percentage": 15.12, "elapsed_time": "0:13:59", "remaining_time": "1:18:32"} |
|
{"current_steps": 40, "total_steps": 258, "loss": 0.0276, "lr": 0.00019845453683673368, "epoch": 0.46511627906976744, "percentage": 15.5, "elapsed_time": "0:14:15", "remaining_time": "1:17:40"} |
|
{"current_steps": 40, "total_steps": 258, "eval_loss": 0.02999330498278141, "epoch": 0.46511627906976744, "percentage": 15.5, "elapsed_time": "0:15:23", "remaining_time": "1:23:55"} |
|
{"current_steps": 41, "total_steps": 258, "loss": 0.0298, "lr": 0.0001982083682742156, "epoch": 0.47674418604651164, "percentage": 15.89, "elapsed_time": "0:15:39", "remaining_time": "1:22:54"} |
|
{"current_steps": 42, "total_steps": 258, "loss": 0.0264, "lr": 0.00019794419170536916, "epoch": 0.4883720930232558, "percentage": 16.28, "elapsed_time": "0:15:56", "remaining_time": "1:21:58"} |
|
{"current_steps": 43, "total_steps": 258, "loss": 0.0286, "lr": 0.00019766205557100868, "epoch": 0.5, "percentage": 16.67, "elapsed_time": "0:16:15", "remaining_time": "1:21:18"} |
|
{"current_steps": 44, "total_steps": 258, "loss": 0.0282, "lr": 0.00019736201160510931, "epoch": 0.5116279069767442, "percentage": 17.05, "elapsed_time": "0:16:32", "remaining_time": "1:20:25"} |
|
{"current_steps": 45, "total_steps": 258, "loss": 0.0253, "lr": 0.00019704411482532116, "epoch": 0.5232558139534884, "percentage": 17.44, "elapsed_time": "0:16:48", "remaining_time": "1:19:33"} |
|
{"current_steps": 46, "total_steps": 258, "loss": 0.0218, "lr": 0.0001967084235228807, "epoch": 0.5348837209302325, "percentage": 17.83, "elapsed_time": "0:17:04", "remaining_time": "1:18:40"} |
|
{"current_steps": 47, "total_steps": 258, "loss": 0.028, "lr": 0.0001963549992519223, "epoch": 0.5465116279069767, "percentage": 18.22, "elapsed_time": "0:17:20", "remaining_time": "1:17:51"} |
|
{"current_steps": 48, "total_steps": 258, "loss": 0.0302, "lr": 0.0001959839068181914, "epoch": 0.5581395348837209, "percentage": 18.6, "elapsed_time": "0:17:36", "remaining_time": "1:17:00"} |
|
{"current_steps": 49, "total_steps": 258, "loss": 0.0242, "lr": 0.00019559521426716118, "epoch": 0.5697674418604651, "percentage": 18.99, "elapsed_time": "0:17:52", "remaining_time": "1:16:12"} |
|
{"current_steps": 50, "total_steps": 258, "loss": 0.0307, "lr": 0.00019518899287155556, "epoch": 0.5813953488372093, "percentage": 19.38, "elapsed_time": "0:18:07", "remaining_time": "1:15:25"} |
|
{"current_steps": 50, "total_steps": 258, "eval_loss": 0.02883034199476242, "epoch": 0.5813953488372093, "percentage": 19.38, "elapsed_time": "0:19:16", "remaining_time": "1:20:12"} |
|
{"current_steps": 51, "total_steps": 258, "loss": 0.0251, "lr": 0.00019476531711828027, "epoch": 0.5930232558139535, "percentage": 19.77, "elapsed_time": "0:19:39", "remaining_time": "1:19:46"} |
|
{"current_steps": 52, "total_steps": 258, "loss": 0.0252, "lr": 0.0001943242646947643, "epoch": 0.6046511627906976, "percentage": 20.16, "elapsed_time": "0:19:55", "remaining_time": "1:18:56"} |
|
{"current_steps": 53, "total_steps": 258, "loss": 0.0287, "lr": 0.00019386591647471506, "epoch": 0.6162790697674418, "percentage": 20.54, "elapsed_time": "0:20:11", "remaining_time": "1:18:04"} |
|
{"current_steps": 54, "total_steps": 258, "loss": 0.0278, "lr": 0.00019339035650328869, "epoch": 0.627906976744186, "percentage": 20.93, "elapsed_time": "0:20:26", "remaining_time": "1:17:14"} |
|
{"current_steps": 55, "total_steps": 258, "loss": 0.0259, "lr": 0.00019289767198167916, "epoch": 0.6395348837209303, "percentage": 21.32, "elapsed_time": "0:20:42", "remaining_time": "1:16:25"} |
|
{"current_steps": 56, "total_steps": 258, "loss": 0.0252, "lr": 0.0001923879532511287, "epoch": 0.6511627906976745, "percentage": 21.71, "elapsed_time": "0:20:58", "remaining_time": "1:15:39"} |
|
{"current_steps": 57, "total_steps": 258, "loss": 0.0274, "lr": 0.0001918612937763622, "epoch": 0.6627906976744186, "percentage": 22.09, "elapsed_time": "0:21:14", "remaining_time": "1:14:52"} |
|
{"current_steps": 58, "total_steps": 258, "loss": 0.0231, "lr": 0.00019131779012844912, "epoch": 0.6744186046511628, "percentage": 22.48, "elapsed_time": "0:21:29", "remaining_time": "1:14:06"} |
|
{"current_steps": 59, "total_steps": 258, "loss": 0.0224, "lr": 0.00019075754196709572, "epoch": 0.686046511627907, "percentage": 22.87, "elapsed_time": "0:21:45", "remaining_time": "1:13:23"} |
|
{"current_steps": 60, "total_steps": 258, "loss": 0.0266, "lr": 0.00019018065202237083, "epoch": 0.6976744186046512, "percentage": 23.26, "elapsed_time": "0:22:01", "remaining_time": "1:12:41"} |
|
{"current_steps": 60, "total_steps": 258, "eval_loss": 0.028244854882359505, "epoch": 0.6976744186046512, "percentage": 23.26, "elapsed_time": "0:23:10", "remaining_time": "1:16:28"} |
|
{"current_steps": 61, "total_steps": 258, "loss": 0.024, "lr": 0.0001895872260758688, "epoch": 0.7093023255813954, "percentage": 23.64, "elapsed_time": "0:23:26", "remaining_time": "1:15:41"} |
|
{"current_steps": 62, "total_steps": 258, "loss": 0.0237, "lr": 0.00018897737294131284, "epoch": 0.7209302325581395, "percentage": 24.03, "elapsed_time": "0:23:42", "remaining_time": "1:14:57"} |
|
{"current_steps": 63, "total_steps": 258, "loss": 0.0261, "lr": 0.0001883512044446023, "epoch": 0.7325581395348837, "percentage": 24.42, "elapsed_time": "0:23:58", "remaining_time": "1:14:13"} |
|
{"current_steps": 64, "total_steps": 258, "loss": 0.0272, "lr": 0.0001877088354033077, "epoch": 0.7441860465116279, "percentage": 24.81, "elapsed_time": "0:24:15", "remaining_time": "1:13:32"} |
|
{"current_steps": 65, "total_steps": 258, "loss": 0.0246, "lr": 0.0001870503836056172, "epoch": 0.7558139534883721, "percentage": 25.19, "elapsed_time": "0:24:30", "remaining_time": "1:12:47"} |
|
{"current_steps": 66, "total_steps": 258, "loss": 0.0294, "lr": 0.00018637596978873835, "epoch": 0.7674418604651163, "percentage": 25.58, "elapsed_time": "0:24:46", "remaining_time": "1:12:05"} |
|
{"current_steps": 67, "total_steps": 258, "loss": 0.025, "lr": 0.00018568571761675893, "epoch": 0.7790697674418605, "percentage": 25.97, "elapsed_time": "0:25:02", "remaining_time": "1:11:23"} |
|
{"current_steps": 68, "total_steps": 258, "loss": 0.0261, "lr": 0.0001849797536579715, "epoch": 0.7906976744186046, "percentage": 26.36, "elapsed_time": "0:25:18", "remaining_time": "1:10:41"} |
|
{"current_steps": 69, "total_steps": 258, "loss": 0.024, "lr": 0.0001842582073616649, "epoch": 0.8023255813953488, "percentage": 26.74, "elapsed_time": "0:25:33", "remaining_time": "1:10:00"} |
|
{"current_steps": 70, "total_steps": 258, "loss": 0.0293, "lr": 0.000183521211034388, "epoch": 0.813953488372093, "percentage": 27.13, "elapsed_time": "0:25:49", "remaining_time": "1:09:22"} |
|
{"current_steps": 70, "total_steps": 258, "eval_loss": 0.02760264091193676, "epoch": 0.813953488372093, "percentage": 27.13, "elapsed_time": "0:26:58", "remaining_time": "1:12:27"} |
|
{"current_steps": 71, "total_steps": 258, "loss": 0.026, "lr": 0.00018276889981568906, "epoch": 0.8255813953488372, "percentage": 27.52, "elapsed_time": "0:27:14", "remaining_time": "1:11:44"} |
|
{"current_steps": 72, "total_steps": 258, "loss": 0.0247, "lr": 0.0001820014116533359, "epoch": 0.8372093023255814, "percentage": 27.91, "elapsed_time": "0:27:30", "remaining_time": "1:11:03"} |
|
{"current_steps": 73, "total_steps": 258, "loss": 0.0259, "lr": 0.00018121888727802113, "epoch": 0.8488372093023255, "percentage": 28.29, "elapsed_time": "0:27:46", "remaining_time": "1:10:22"} |
|
{"current_steps": 74, "total_steps": 258, "loss": 0.0276, "lr": 0.0001804214701775569, "epoch": 0.8604651162790697, "percentage": 28.68, "elapsed_time": "0:28:02", "remaining_time": "1:09:43"} |
|
{"current_steps": 75, "total_steps": 258, "loss": 0.0229, "lr": 0.00017960930657056438, "epoch": 0.872093023255814, "percentage": 29.07, "elapsed_time": "0:28:18", "remaining_time": "1:09:04"} |
|
{"current_steps": 76, "total_steps": 258, "loss": 0.0202, "lr": 0.00017878254537966216, "epoch": 0.8837209302325582, "percentage": 29.46, "elapsed_time": "0:28:34", "remaining_time": "1:08:26"} |
|
{"current_steps": 77, "total_steps": 258, "loss": 0.026, "lr": 0.00017794133820415916, "epoch": 0.8953488372093024, "percentage": 29.84, "elapsed_time": "0:28:50", "remaining_time": "1:07:47"} |
|
{"current_steps": 78, "total_steps": 258, "loss": 0.0253, "lr": 0.0001770858392922565, "epoch": 0.9069767441860465, "percentage": 30.23, "elapsed_time": "0:29:06", "remaining_time": "1:07:10"} |
|
{"current_steps": 79, "total_steps": 258, "loss": 0.0227, "lr": 0.00017621620551276366, "epoch": 0.9186046511627907, "percentage": 30.62, "elapsed_time": "0:29:22", "remaining_time": "1:06:33"} |
|
{"current_steps": 80, "total_steps": 258, "loss": 0.0254, "lr": 0.00017533259632633442, "epoch": 0.9302325581395349, "percentage": 31.01, "elapsed_time": "0:29:38", "remaining_time": "1:05:56"} |
|
{"current_steps": 80, "total_steps": 258, "eval_loss": 0.026909608393907547, "epoch": 0.9302325581395349, "percentage": 31.01, "elapsed_time": "0:30:47", "remaining_time": "1:08:30"} |
|
{"current_steps": 81, "total_steps": 258, "loss": 0.0261, "lr": 0.00017443517375622704, "epoch": 0.9418604651162791, "percentage": 31.4, "elapsed_time": "0:31:04", "remaining_time": "1:07:54"} |
|
{"current_steps": 82, "total_steps": 258, "loss": 0.0256, "lr": 0.00017352410235859503, "epoch": 0.9534883720930233, "percentage": 31.78, "elapsed_time": "0:31:20", "remaining_time": "1:07:16"} |
|
{"current_steps": 83, "total_steps": 258, "loss": 0.0262, "lr": 0.0001725995491923131, "epoch": 0.9651162790697675, "percentage": 32.17, "elapsed_time": "0:31:36", "remaining_time": "1:06:38"} |
|
{"current_steps": 84, "total_steps": 258, "loss": 0.0251, "lr": 0.00017166168378834448, "epoch": 0.9767441860465116, "percentage": 32.56, "elapsed_time": "0:31:52", "remaining_time": "1:06:01"} |
|
{"current_steps": 85, "total_steps": 258, "loss": 0.0254, "lr": 0.00017071067811865476, "epoch": 0.9883720930232558, "percentage": 32.95, "elapsed_time": "0:32:07", "remaining_time": "1:05:23"} |
|
{"current_steps": 86, "total_steps": 258, "loss": 0.0238, "lr": 0.00016974670656467824, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:32:23", "remaining_time": "1:04:47"} |
|
{"current_steps": 87, "total_steps": 258, "loss": 0.0296, "lr": 0.00016876994588534234, "epoch": 1.0116279069767442, "percentage": 33.72, "elapsed_time": "0:32:40", "remaining_time": "1:04:12"} |
|
{"current_steps": 88, "total_steps": 258, "loss": 0.018, "lr": 0.0001677805751846563, "epoch": 1.0232558139534884, "percentage": 34.11, "elapsed_time": "0:32:56", "remaining_time": "1:03:37"} |
|
{"current_steps": 89, "total_steps": 258, "loss": 0.0244, "lr": 0.00016677877587886956, "epoch": 1.0348837209302326, "percentage": 34.5, "elapsed_time": "0:33:11", "remaining_time": "1:03:01"} |
|
{"current_steps": 90, "total_steps": 258, "loss": 0.0215, "lr": 0.00016576473166320644, "epoch": 1.0465116279069768, "percentage": 34.88, "elapsed_time": "0:33:28", "remaining_time": "1:02:29"} |
|
{"current_steps": 90, "total_steps": 258, "eval_loss": 0.026453962549567223, "epoch": 1.0465116279069768, "percentage": 34.88, "elapsed_time": "0:34:37", "remaining_time": "1:04:37"} |
|
{"current_steps": 91, "total_steps": 258, "loss": 0.0251, "lr": 0.00016473862847818277, "epoch": 1.058139534883721, "percentage": 35.27, "elapsed_time": "0:34:53", "remaining_time": "1:04:02"} |
|
{"current_steps": 92, "total_steps": 258, "loss": 0.0224, "lr": 0.00016370065447551078, "epoch": 1.069767441860465, "percentage": 35.66, "elapsed_time": "0:35:09", "remaining_time": "1:03:26"} |
|
{"current_steps": 93, "total_steps": 258, "loss": 0.0236, "lr": 0.00016265099998359866, "epoch": 1.0813953488372092, "percentage": 36.05, "elapsed_time": "0:35:25", "remaining_time": "1:02:51"} |
|
{"current_steps": 94, "total_steps": 258, "loss": 0.0253, "lr": 0.00016158985747265108, "epoch": 1.0930232558139534, "percentage": 36.43, "elapsed_time": "0:35:41", "remaining_time": "1:02:16"} |
|
{"current_steps": 95, "total_steps": 258, "loss": 0.0228, "lr": 0.00016051742151937655, "epoch": 1.1046511627906976, "percentage": 36.82, "elapsed_time": "0:35:57", "remaining_time": "1:01:42"} |
|
{"current_steps": 96, "total_steps": 258, "loss": 0.0193, "lr": 0.000159433888771309, "epoch": 1.1162790697674418, "percentage": 37.21, "elapsed_time": "0:36:14", "remaining_time": "1:01:09"} |
|
{"current_steps": 97, "total_steps": 258, "loss": 0.0206, "lr": 0.00015833945791074943, "epoch": 1.127906976744186, "percentage": 37.6, "elapsed_time": "0:36:29", "remaining_time": "1:00:34"} |
|
{"current_steps": 98, "total_steps": 258, "loss": 0.0189, "lr": 0.0001572343296183344, "epoch": 1.1395348837209303, "percentage": 37.98, "elapsed_time": "0:36:45", "remaining_time": "1:00:00"} |
|
{"current_steps": 99, "total_steps": 258, "loss": 0.0226, "lr": 0.00015611870653623825, "epoch": 1.1511627906976745, "percentage": 38.37, "elapsed_time": "0:37:02", "remaining_time": "0:59:28"} |
|
{"current_steps": 100, "total_steps": 258, "loss": 0.0176, "lr": 0.0001549927932310155, "epoch": 1.1627906976744187, "percentage": 38.76, "elapsed_time": "0:37:17", "remaining_time": "0:58:55"} |
|
{"current_steps": 100, "total_steps": 258, "eval_loss": 0.026211915537714958, "epoch": 1.1627906976744187, "percentage": 38.76, "elapsed_time": "0:38:26", "remaining_time": "1:00:44"} |
|
{"current_steps": 101, "total_steps": 258, "loss": 0.0269, "lr": 0.00015385679615609042, "epoch": 1.1744186046511629, "percentage": 39.15, "elapsed_time": "0:38:43", "remaining_time": "1:00:12"} |
|
{"current_steps": 102, "total_steps": 258, "loss": 0.0258, "lr": 0.00015271092361390077, "epoch": 1.1860465116279069, "percentage": 39.53, "elapsed_time": "0:38:59", "remaining_time": "0:59:37"} |
|
{"current_steps": 103, "total_steps": 258, "loss": 0.0244, "lr": 0.00015155538571770218, "epoch": 1.197674418604651, "percentage": 39.92, "elapsed_time": "0:39:14", "remaining_time": "0:59:03"} |
|
{"current_steps": 104, "total_steps": 258, "loss": 0.0235, "lr": 0.00015039039435304078, "epoch": 1.2093023255813953, "percentage": 40.31, "elapsed_time": "0:39:30", "remaining_time": "0:58:30"} |
|
{"current_steps": 105, "total_steps": 258, "loss": 0.021, "lr": 0.00014921616313890072, "epoch": 1.2209302325581395, "percentage": 40.7, "elapsed_time": "0:39:46", "remaining_time": "0:57:56"} |
|
{"current_steps": 106, "total_steps": 258, "loss": 0.0218, "lr": 0.00014803290738853395, "epoch": 1.2325581395348837, "percentage": 41.09, "elapsed_time": "0:40:02", "remaining_time": "0:57:24"} |
|
{"current_steps": 107, "total_steps": 258, "loss": 0.0197, "lr": 0.00014684084406997903, "epoch": 1.244186046511628, "percentage": 41.47, "elapsed_time": "0:40:18", "remaining_time": "0:56:53"} |
|
{"current_steps": 108, "total_steps": 258, "loss": 0.022, "lr": 0.0001456401917662769, "epoch": 1.255813953488372, "percentage": 41.86, "elapsed_time": "0:40:35", "remaining_time": "0:56:22"} |
|
{"current_steps": 109, "total_steps": 258, "loss": 0.0249, "lr": 0.00014443117063539038, "epoch": 1.2674418604651163, "percentage": 42.25, "elapsed_time": "0:40:52", "remaining_time": "0:55:51"} |
|
{"current_steps": 110, "total_steps": 258, "loss": 0.0227, "lr": 0.00014321400236983457, "epoch": 1.2790697674418605, "percentage": 42.64, "elapsed_time": "0:41:10", "remaining_time": "0:55:24"} |
|
{"current_steps": 110, "total_steps": 258, "eval_loss": 0.025697337463498116, "epoch": 1.2790697674418605, "percentage": 42.64, "elapsed_time": "0:42:19", "remaining_time": "0:56:56"} |
|
{"current_steps": 111, "total_steps": 258, "loss": 0.0225, "lr": 0.00014198891015602646, "epoch": 1.2906976744186047, "percentage": 43.02, "elapsed_time": "0:42:35", "remaining_time": "0:56:23"} |
|
{"current_steps": 112, "total_steps": 258, "loss": 0.0231, "lr": 0.0001407561186333601, "epoch": 1.302325581395349, "percentage": 43.41, "elapsed_time": "0:42:51", "remaining_time": "0:55:52"} |
|
{"current_steps": 113, "total_steps": 258, "loss": 0.0187, "lr": 0.00013951585385301555, "epoch": 1.3139534883720931, "percentage": 43.8, "elapsed_time": "0:43:07", "remaining_time": "0:55:19"} |
|
{"current_steps": 114, "total_steps": 258, "loss": 0.0251, "lr": 0.000138268343236509, "epoch": 1.3255813953488373, "percentage": 44.19, "elapsed_time": "0:43:23", "remaining_time": "0:54:49"} |
|
{"current_steps": 115, "total_steps": 258, "loss": 0.0206, "lr": 0.00013701381553399145, "epoch": 1.3372093023255813, "percentage": 44.57, "elapsed_time": "0:43:40", "remaining_time": "0:54:18"} |
|
{"current_steps": 116, "total_steps": 258, "loss": 0.0195, "lr": 0.000135752500782304, "epoch": 1.3488372093023255, "percentage": 44.96, "elapsed_time": "0:43:56", "remaining_time": "0:53:46"} |
|
{"current_steps": 117, "total_steps": 258, "loss": 0.0253, "lr": 0.00013448463026279704, "epoch": 1.3604651162790697, "percentage": 45.35, "elapsed_time": "0:44:11", "remaining_time": "0:53:15"} |
|
{"current_steps": 118, "total_steps": 258, "loss": 0.0196, "lr": 0.0001332104364589212, "epoch": 1.372093023255814, "percentage": 45.74, "elapsed_time": "0:44:27", "remaining_time": "0:52:45"} |
|
{"current_steps": 119, "total_steps": 258, "loss": 0.0219, "lr": 0.000131930153013598, "epoch": 1.3837209302325582, "percentage": 46.12, "elapsed_time": "0:44:44", "remaining_time": "0:52:15"} |
|
{"current_steps": 120, "total_steps": 258, "loss": 0.0198, "lr": 0.00013064401468637792, "epoch": 1.3953488372093024, "percentage": 46.51, "elapsed_time": "0:44:59", "remaining_time": "0:51:44"} |
|
{"current_steps": 120, "total_steps": 258, "eval_loss": 0.025383805856108665, "epoch": 1.3953488372093024, "percentage": 46.51, "elapsed_time": "0:46:08", "remaining_time": "0:53:03"} |
|
{"current_steps": 121, "total_steps": 258, "loss": 0.0268, "lr": 0.00012935225731039348, "epoch": 1.4069767441860466, "percentage": 46.9, "elapsed_time": "0:46:24", "remaining_time": "0:52:33"} |
|
{"current_steps": 122, "total_steps": 258, "loss": 0.0233, "lr": 0.00012805511774911584, "epoch": 1.4186046511627908, "percentage": 47.29, "elapsed_time": "0:46:40", "remaining_time": "0:52:01"} |
|
{"current_steps": 123, "total_steps": 258, "loss": 0.0222, "lr": 0.00012675283385292212, "epoch": 1.4302325581395348, "percentage": 47.67, "elapsed_time": "0:46:56", "remaining_time": "0:51:31"} |
|
{"current_steps": 124, "total_steps": 258, "loss": 0.0251, "lr": 0.00012544564441548182, "epoch": 1.441860465116279, "percentage": 48.06, "elapsed_time": "0:47:12", "remaining_time": "0:51:01"} |
|
{"current_steps": 125, "total_steps": 258, "loss": 0.0202, "lr": 0.00012413378912997058, "epoch": 1.4534883720930232, "percentage": 48.45, "elapsed_time": "0:47:28", "remaining_time": "0:50:30"} |
|
{"current_steps": 126, "total_steps": 258, "loss": 0.0219, "lr": 0.0001228175085451186, "epoch": 1.4651162790697674, "percentage": 48.84, "elapsed_time": "0:47:44", "remaining_time": "0:50:01"} |
|
{"current_steps": 127, "total_steps": 258, "loss": 0.0185, "lr": 0.00012149704402110243, "epoch": 1.4767441860465116, "percentage": 49.22, "elapsed_time": "0:48:00", "remaining_time": "0:49:31"} |
|
{"current_steps": 128, "total_steps": 258, "loss": 0.0196, "lr": 0.00012017263768528775, "epoch": 1.4883720930232558, "percentage": 49.61, "elapsed_time": "0:48:16", "remaining_time": "0:49:01"} |
|
{"current_steps": 129, "total_steps": 258, "loss": 0.0223, "lr": 0.00011884453238783185, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "0:48:32", "remaining_time": "0:48:32"} |
|
{"current_steps": 130, "total_steps": 258, "loss": 0.0245, "lr": 0.00011751297165715309, "epoch": 1.5116279069767442, "percentage": 50.39, "elapsed_time": "0:48:48", "remaining_time": "0:48:03"} |
|
{"current_steps": 130, "total_steps": 258, "eval_loss": 0.025349650532007217, "epoch": 1.5116279069767442, "percentage": 50.39, "elapsed_time": "0:49:56", "remaining_time": "0:49:10"} |
|
{"current_steps": 131, "total_steps": 258, "loss": 0.0217, "lr": 0.0001161781996552765, "epoch": 1.5232558139534884, "percentage": 50.78, "elapsed_time": "0:50:12", "remaining_time": "0:48:40"} |
|
{"current_steps": 132, "total_steps": 258, "loss": 0.0196, "lr": 0.00011484046113306262, "epoch": 1.5348837209302326, "percentage": 51.16, "elapsed_time": "0:50:28", "remaining_time": "0:48:10"} |
|
{"current_steps": 133, "total_steps": 258, "loss": 0.0237, "lr": 0.00011350000138532902, "epoch": 1.5465116279069768, "percentage": 51.55, "elapsed_time": "0:50:44", "remaining_time": "0:47:41"} |
|
{"current_steps": 134, "total_steps": 258, "loss": 0.0203, "lr": 0.00011215706620587149, "epoch": 1.558139534883721, "percentage": 51.94, "elapsed_time": "0:51:01", "remaining_time": "0:47:12"} |
|
{"current_steps": 135, "total_steps": 258, "loss": 0.0192, "lr": 0.00011081190184239419, "epoch": 1.5697674418604652, "percentage": 52.33, "elapsed_time": "0:51:16", "remaining_time": "0:46:43"} |
|
{"current_steps": 136, "total_steps": 258, "loss": 0.0268, "lr": 0.0001094647549513561, "epoch": 1.5813953488372094, "percentage": 52.71, "elapsed_time": "0:51:32", "remaining_time": "0:46:14"} |
|
{"current_steps": 137, "total_steps": 258, "loss": 0.0213, "lr": 0.00010811587255274313, "epoch": 1.5930232558139537, "percentage": 53.1, "elapsed_time": "0:51:48", "remaining_time": "0:45:45"} |
|
{"current_steps": 138, "total_steps": 258, "loss": 0.0203, "lr": 0.00010676550198477293, "epoch": 1.6046511627906976, "percentage": 53.49, "elapsed_time": "0:52:05", "remaining_time": "0:45:17"} |
|
{"current_steps": 139, "total_steps": 258, "loss": 0.0255, "lr": 0.00010541389085854176, "epoch": 1.6162790697674418, "percentage": 53.88, "elapsed_time": "0:52:21", "remaining_time": "0:44:49"} |
|
{"current_steps": 140, "total_steps": 258, "loss": 0.0217, "lr": 0.00010406128701262128, "epoch": 1.627906976744186, "percentage": 54.26, "elapsed_time": "0:52:37", "remaining_time": "0:44:21"} |
|
{"current_steps": 140, "total_steps": 258, "eval_loss": 0.025237275287508965, "epoch": 1.627906976744186, "percentage": 54.26, "elapsed_time": "0:53:46", "remaining_time": "0:45:19"} |
|
{"current_steps": 141, "total_steps": 258, "loss": 0.022, "lr": 0.00010270793846761347, "epoch": 1.6395348837209303, "percentage": 54.65, "elapsed_time": "0:54:02", "remaining_time": "0:44:50"} |
|
{"current_steps": 142, "total_steps": 258, "loss": 0.0208, "lr": 0.00010135409338067219, "epoch": 1.6511627906976745, "percentage": 55.04, "elapsed_time": "0:54:18", "remaining_time": "0:44:22"} |
|
{"current_steps": 143, "total_steps": 258, "loss": 0.0226, "lr": 0.0001, "epoch": 1.6627906976744184, "percentage": 55.43, "elapsed_time": "0:54:34", "remaining_time": "0:43:53"} |
|
{"current_steps": 144, "total_steps": 258, "loss": 0.0216, "lr": 9.864590661932783e-05, "epoch": 1.6744186046511627, "percentage": 55.81, "elapsed_time": "0:54:50", "remaining_time": "0:43:24"} |
|
{"current_steps": 145, "total_steps": 258, "loss": 0.0255, "lr": 9.729206153238657e-05, "epoch": 1.6860465116279069, "percentage": 56.2, "elapsed_time": "0:55:06", "remaining_time": "0:42:56"} |
|
{"current_steps": 146, "total_steps": 258, "loss": 0.0273, "lr": 9.59387129873787e-05, "epoch": 1.697674418604651, "percentage": 56.59, "elapsed_time": "0:55:22", "remaining_time": "0:42:28"} |
|
{"current_steps": 147, "total_steps": 258, "loss": 0.0206, "lr": 9.458610914145826e-05, "epoch": 1.7093023255813953, "percentage": 56.98, "elapsed_time": "0:55:38", "remaining_time": "0:42:00"} |
|
{"current_steps": 148, "total_steps": 258, "loss": 0.0194, "lr": 9.323449801522709e-05, "epoch": 1.7209302325581395, "percentage": 57.36, "elapsed_time": "0:55:54", "remaining_time": "0:41:33"} |
|
{"current_steps": 149, "total_steps": 258, "loss": 0.0184, "lr": 9.18841274472569e-05, "epoch": 1.7325581395348837, "percentage": 57.75, "elapsed_time": "0:56:11", "remaining_time": "0:41:06"} |
|
{"current_steps": 150, "total_steps": 258, "loss": 0.0209, "lr": 9.05352450486439e-05, "epoch": 1.744186046511628, "percentage": 58.14, "elapsed_time": "0:56:27", "remaining_time": "0:40:39"} |
|
{"current_steps": 150, "total_steps": 258, "eval_loss": 0.024917516857385635, "epoch": 1.744186046511628, "percentage": 58.14, "elapsed_time": "0:57:36", "remaining_time": "0:41:28"} |
|
{"current_steps": 151, "total_steps": 258, "loss": 0.0193, "lr": 8.918809815760585e-05, "epoch": 1.755813953488372, "percentage": 58.53, "elapsed_time": "0:57:53", "remaining_time": "0:41:01"} |
|
{"current_steps": 152, "total_steps": 258, "loss": 0.0234, "lr": 8.78429337941285e-05, "epoch": 1.7674418604651163, "percentage": 58.91, "elapsed_time": "0:58:10", "remaining_time": "0:40:33"} |
|
{"current_steps": 153, "total_steps": 258, "loss": 0.0213, "lr": 8.649999861467099e-05, "epoch": 1.7790697674418605, "percentage": 59.3, "elapsed_time": "0:58:25", "remaining_time": "0:40:05"} |
|
{"current_steps": 154, "total_steps": 258, "loss": 0.02, "lr": 8.515953886693739e-05, "epoch": 1.7906976744186047, "percentage": 59.69, "elapsed_time": "0:58:41", "remaining_time": "0:39:38"} |
|
{"current_steps": 155, "total_steps": 258, "loss": 0.0199, "lr": 8.382180034472353e-05, "epoch": 1.802325581395349, "percentage": 60.08, "elapsed_time": "0:58:58", "remaining_time": "0:39:11"} |
|
{"current_steps": 156, "total_steps": 258, "loss": 0.0227, "lr": 8.248702834284693e-05, "epoch": 1.8139534883720931, "percentage": 60.47, "elapsed_time": "0:59:13", "remaining_time": "0:38:43"} |
|
{"current_steps": 157, "total_steps": 258, "loss": 0.0168, "lr": 8.115546761216822e-05, "epoch": 1.8255813953488373, "percentage": 60.85, "elapsed_time": "0:59:29", "remaining_time": "0:38:16"} |
|
{"current_steps": 158, "total_steps": 258, "loss": 0.022, "lr": 7.982736231471224e-05, "epoch": 1.8372093023255816, "percentage": 61.24, "elapsed_time": "0:59:44", "remaining_time": "0:37:48"} |
|
{"current_steps": 159, "total_steps": 258, "loss": 0.0221, "lr": 7.85029559788976e-05, "epoch": 1.8488372093023255, "percentage": 61.63, "elapsed_time": "1:00:00", "remaining_time": "0:37:21"} |
|
{"current_steps": 160, "total_steps": 258, "loss": 0.0227, "lr": 7.718249145488142e-05, "epoch": 1.8604651162790697, "percentage": 62.02, "elapsed_time": "1:00:16", "remaining_time": "0:36:54"} |
|
{"current_steps": 160, "total_steps": 258, "eval_loss": 0.024740872904658318, "epoch": 1.8604651162790697, "percentage": 62.02, "elapsed_time": "1:01:25", "remaining_time": "0:37:37"} |
|
{"current_steps": 161, "total_steps": 258, "loss": 0.0192, "lr": 7.586621087002945e-05, "epoch": 1.872093023255814, "percentage": 62.4, "elapsed_time": "1:01:40", "remaining_time": "0:37:09"} |
|
{"current_steps": 162, "total_steps": 258, "loss": 0.0213, "lr": 7.455435558451823e-05, "epoch": 1.8837209302325582, "percentage": 62.79, "elapsed_time": "1:01:57", "remaining_time": "0:36:43"} |
|
{"current_steps": 163, "total_steps": 258, "loss": 0.0212, "lr": 7.324716614707793e-05, "epoch": 1.8953488372093024, "percentage": 63.18, "elapsed_time": "1:02:15", "remaining_time": "0:36:17"} |
|
{"current_steps": 164, "total_steps": 258, "loss": 0.0172, "lr": 7.194488225088417e-05, "epoch": 1.9069767441860463, "percentage": 63.57, "elapsed_time": "1:02:31", "remaining_time": "0:35:50"} |
|
{"current_steps": 165, "total_steps": 258, "loss": 0.0218, "lr": 7.064774268960653e-05, "epoch": 1.9186046511627906, "percentage": 63.95, "elapsed_time": "1:02:48", "remaining_time": "0:35:23"} |
|
{"current_steps": 166, "total_steps": 258, "loss": 0.02, "lr": 6.93559853136221e-05, "epoch": 1.9302325581395348, "percentage": 64.34, "elapsed_time": "1:03:04", "remaining_time": "0:34:57"} |
|
{"current_steps": 167, "total_steps": 258, "loss": 0.0245, "lr": 6.806984698640202e-05, "epoch": 1.941860465116279, "percentage": 64.73, "elapsed_time": "1:03:19", "remaining_time": "0:34:30"} |
|
{"current_steps": 168, "total_steps": 258, "loss": 0.025, "lr": 6.678956354107882e-05, "epoch": 1.9534883720930232, "percentage": 65.12, "elapsed_time": "1:03:35", "remaining_time": "0:34:04"} |
|
{"current_steps": 169, "total_steps": 258, "loss": 0.0174, "lr": 6.551536973720298e-05, "epoch": 1.9651162790697674, "percentage": 65.5, "elapsed_time": "1:03:51", "remaining_time": "0:33:38"} |
|
{"current_steps": 170, "total_steps": 258, "loss": 0.0195, "lr": 6.4247499217696e-05, "epoch": 1.9767441860465116, "percentage": 65.89, "elapsed_time": "1:04:07", "remaining_time": "0:33:11"} |
|
{"current_steps": 170, "total_steps": 258, "eval_loss": 0.02444678172469139, "epoch": 1.9767441860465116, "percentage": 65.89, "elapsed_time": "1:05:17", "remaining_time": "0:33:47"} |
|
{"current_steps": 171, "total_steps": 258, "loss": 0.02, "lr": 6.298618446600856e-05, "epoch": 1.9883720930232558, "percentage": 66.28, "elapsed_time": "1:05:32", "remaining_time": "0:33:20"} |
|
{"current_steps": 172, "total_steps": 258, "loss": 0.0211, "lr": 6.173165676349103e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:05:48", "remaining_time": "0:32:54"} |
|
{"current_steps": 173, "total_steps": 258, "loss": 0.0205, "lr": 6.048414614698448e-05, "epoch": 2.011627906976744, "percentage": 67.05, "elapsed_time": "1:06:05", "remaining_time": "0:32:28"} |
|
{"current_steps": 174, "total_steps": 258, "loss": 0.0187, "lr": 5.924388136663992e-05, "epoch": 2.0232558139534884, "percentage": 67.44, "elapsed_time": "1:06:20", "remaining_time": "0:32:01"} |
|
{"current_steps": 175, "total_steps": 258, "loss": 0.0153, "lr": 5.801108984397354e-05, "epoch": 2.0348837209302326, "percentage": 67.83, "elapsed_time": "1:06:36", "remaining_time": "0:31:35"} |
|
{"current_steps": 176, "total_steps": 258, "loss": 0.0192, "lr": 5.6785997630165435e-05, "epoch": 2.046511627906977, "percentage": 68.22, "elapsed_time": "1:06:52", "remaining_time": "0:31:09"} |
|
{"current_steps": 177, "total_steps": 258, "loss": 0.0171, "lr": 5.5568829364609664e-05, "epoch": 2.058139534883721, "percentage": 68.6, "elapsed_time": "1:07:09", "remaining_time": "0:30:43"} |
|
{"current_steps": 178, "total_steps": 258, "loss": 0.0184, "lr": 5.435980823372311e-05, "epoch": 2.0697674418604652, "percentage": 68.99, "elapsed_time": "1:07:24", "remaining_time": "0:30:17"} |
|
{"current_steps": 179, "total_steps": 258, "loss": 0.0191, "lr": 5.3159155930021e-05, "epoch": 2.0813953488372094, "percentage": 69.38, "elapsed_time": "1:07:40", "remaining_time": "0:29:51"} |
|
{"current_steps": 180, "total_steps": 258, "loss": 0.0174, "lr": 5.196709261146606e-05, "epoch": 2.0930232558139537, "percentage": 69.77, "elapsed_time": "1:07:55", "remaining_time": "0:29:26"} |
|
{"current_steps": 180, "total_steps": 258, "eval_loss": 0.024556750431656837, "epoch": 2.0930232558139537, "percentage": 69.77, "elapsed_time": "1:09:04", "remaining_time": "0:29:55"} |
|
{"current_steps": 181, "total_steps": 258, "loss": 0.0192, "lr": 5.078383686109926e-05, "epoch": 2.104651162790698, "percentage": 70.16, "elapsed_time": "1:09:20", "remaining_time": "0:29:29"} |
|
{"current_steps": 182, "total_steps": 258, "loss": 0.0182, "lr": 4.9609605646959226e-05, "epoch": 2.116279069767442, "percentage": 70.54, "elapsed_time": "1:09:35", "remaining_time": "0:29:03"} |
|
{"current_steps": 183, "total_steps": 258, "loss": 0.0168, "lr": 4.844461428229782e-05, "epoch": 2.1279069767441863, "percentage": 70.93, "elapsed_time": "1:09:51", "remaining_time": "0:28:37"} |
|
{"current_steps": 184, "total_steps": 258, "loss": 0.0209, "lr": 4.728907638609925e-05, "epoch": 2.13953488372093, "percentage": 71.32, "elapsed_time": "1:10:07", "remaining_time": "0:28:12"} |
|
{"current_steps": 185, "total_steps": 258, "loss": 0.0171, "lr": 4.614320384390959e-05, "epoch": 2.1511627906976742, "percentage": 71.71, "elapsed_time": "1:10:23", "remaining_time": "0:27:46"} |
|
{"current_steps": 186, "total_steps": 258, "loss": 0.0196, "lr": 4.500720676898452e-05, "epoch": 2.1627906976744184, "percentage": 72.09, "elapsed_time": "1:10:39", "remaining_time": "0:27:21"} |
|
{"current_steps": 187, "total_steps": 258, "loss": 0.0154, "lr": 4.388129346376178e-05, "epoch": 2.1744186046511627, "percentage": 72.48, "elapsed_time": "1:10:55", "remaining_time": "0:26:55"} |
|
{"current_steps": 188, "total_steps": 258, "loss": 0.0214, "lr": 4.276567038166563e-05, "epoch": 2.186046511627907, "percentage": 72.87, "elapsed_time": "1:11:11", "remaining_time": "0:26:30"} |
|
{"current_steps": 189, "total_steps": 258, "loss": 0.0162, "lr": 4.16605420892506e-05, "epoch": 2.197674418604651, "percentage": 73.26, "elapsed_time": "1:11:26", "remaining_time": "0:26:05"} |
|
{"current_steps": 190, "total_steps": 258, "loss": 0.018, "lr": 4.0566111228691064e-05, "epoch": 2.2093023255813953, "percentage": 73.64, "elapsed_time": "1:11:42", "remaining_time": "0:25:39"} |
|
{"current_steps": 190, "total_steps": 258, "eval_loss": 0.02473200112581253, "epoch": 2.2093023255813953, "percentage": 73.64, "elapsed_time": "1:12:51", "remaining_time": "0:26:04"} |
|
{"current_steps": 191, "total_steps": 258, "loss": 0.0169, "lr": 3.948257848062351e-05, "epoch": 2.2209302325581395, "percentage": 74.03, "elapsed_time": "1:13:07", "remaining_time": "0:25:38"} |
|
{"current_steps": 192, "total_steps": 258, "loss": 0.0179, "lr": 3.841014252734896e-05, "epoch": 2.2325581395348837, "percentage": 74.42, "elapsed_time": "1:13:23", "remaining_time": "0:25:13"} |
|
{"current_steps": 193, "total_steps": 258, "loss": 0.0185, "lr": 3.734900001640135e-05, "epoch": 2.244186046511628, "percentage": 74.81, "elapsed_time": "1:13:38", "remaining_time": "0:24:48"} |
|
{"current_steps": 194, "total_steps": 258, "loss": 0.0192, "lr": 3.629934552448925e-05, "epoch": 2.255813953488372, "percentage": 75.19, "elapsed_time": "1:13:55", "remaining_time": "0:24:23"} |
|
{"current_steps": 195, "total_steps": 258, "loss": 0.0211, "lr": 3.5261371521817244e-05, "epoch": 2.2674418604651163, "percentage": 75.58, "elapsed_time": "1:14:10", "remaining_time": "0:23:57"} |
|
{"current_steps": 196, "total_steps": 258, "loss": 0.0187, "lr": 3.423526833679355e-05, "epoch": 2.2790697674418605, "percentage": 75.97, "elapsed_time": "1:14:26", "remaining_time": "0:23:32"} |
|
{"current_steps": 197, "total_steps": 258, "loss": 0.0187, "lr": 3.322122412113047e-05, "epoch": 2.2906976744186047, "percentage": 76.36, "elapsed_time": "1:14:42", "remaining_time": "0:23:07"} |
|
{"current_steps": 198, "total_steps": 258, "loss": 0.0175, "lr": 3.2219424815343735e-05, "epoch": 2.302325581395349, "percentage": 76.74, "elapsed_time": "1:14:57", "remaining_time": "0:22:43"} |
|
{"current_steps": 199, "total_steps": 258, "loss": 0.0174, "lr": 3.123005411465766e-05, "epoch": 2.313953488372093, "percentage": 77.13, "elapsed_time": "1:15:14", "remaining_time": "0:22:18"} |
|
{"current_steps": 200, "total_steps": 258, "loss": 0.0176, "lr": 3.0253293435321793e-05, "epoch": 2.3255813953488373, "percentage": 77.52, "elapsed_time": "1:15:30", "remaining_time": "0:21:53"} |
|
{"current_steps": 200, "total_steps": 258, "eval_loss": 0.024754056707024574, "epoch": 2.3255813953488373, "percentage": 77.52, "elapsed_time": "1:16:38", "remaining_time": "0:22:13"} |
|
{"current_steps": 201, "total_steps": 258, "loss": 0.019, "lr": 2.9289321881345254e-05, "epoch": 2.3372093023255816, "percentage": 77.91, "elapsed_time": "1:16:56", "remaining_time": "0:21:49"} |
|
{"current_steps": 202, "total_steps": 258, "loss": 0.0198, "lr": 2.8338316211655536e-05, "epoch": 2.3488372093023258, "percentage": 78.29, "elapsed_time": "1:17:12", "remaining_time": "0:21:24"} |
|
{"current_steps": 203, "total_steps": 258, "loss": 0.0197, "lr": 2.7400450807686938e-05, "epoch": 2.3604651162790695, "percentage": 78.68, "elapsed_time": "1:17:28", "remaining_time": "0:20:59"} |
|
{"current_steps": 204, "total_steps": 258, "loss": 0.0188, "lr": 2.647589764140499e-05, "epoch": 2.3720930232558137, "percentage": 79.07, "elapsed_time": "1:17:44", "remaining_time": "0:20:34"} |
|
{"current_steps": 205, "total_steps": 258, "loss": 0.0171, "lr": 2.5564826243772966e-05, "epoch": 2.383720930232558, "percentage": 79.46, "elapsed_time": "1:18:00", "remaining_time": "0:20:10"} |
|
{"current_steps": 206, "total_steps": 258, "loss": 0.0188, "lr": 2.4667403673665623e-05, "epoch": 2.395348837209302, "percentage": 79.84, "elapsed_time": "1:18:16", "remaining_time": "0:19:45"} |
|
{"current_steps": 207, "total_steps": 258, "loss": 0.0183, "lr": 2.3783794487236365e-05, "epoch": 2.4069767441860463, "percentage": 80.23, "elapsed_time": "1:18:32", "remaining_time": "0:19:21"} |
|
{"current_steps": 208, "total_steps": 258, "loss": 0.0213, "lr": 2.2914160707743538e-05, "epoch": 2.4186046511627906, "percentage": 80.62, "elapsed_time": "1:18:48", "remaining_time": "0:18:56"} |
|
{"current_steps": 209, "total_steps": 258, "loss": 0.0196, "lr": 2.205866179584084e-05, "epoch": 2.4302325581395348, "percentage": 81.01, "elapsed_time": "1:19:06", "remaining_time": "0:18:32"} |
|
{"current_steps": 210, "total_steps": 258, "loss": 0.0149, "lr": 2.121745462033784e-05, "epoch": 2.441860465116279, "percentage": 81.4, "elapsed_time": "1:19:22", "remaining_time": "0:18:08"} |
|
{"current_steps": 210, "total_steps": 258, "eval_loss": 0.02469288930296898, "epoch": 2.441860465116279, "percentage": 81.4, "elapsed_time": "1:20:32", "remaining_time": "0:18:24"} |
|
{"current_steps": 211, "total_steps": 258, "loss": 0.0167, "lr": 2.0390693429435627e-05, "epoch": 2.453488372093023, "percentage": 81.78, "elapsed_time": "1:20:47", "remaining_time": "0:17:59"} |
|
{"current_steps": 212, "total_steps": 258, "loss": 0.0183, "lr": 1.957852982244309e-05, "epoch": 2.4651162790697674, "percentage": 82.17, "elapsed_time": "1:21:03", "remaining_time": "0:17:35"} |
|
{"current_steps": 213, "total_steps": 258, "loss": 0.0165, "lr": 1.87811127219789e-05, "epoch": 2.4767441860465116, "percentage": 82.56, "elapsed_time": "1:21:19", "remaining_time": "0:17:10"} |
|
{"current_steps": 214, "total_steps": 258, "loss": 0.0154, "lr": 1.7998588346664115e-05, "epoch": 2.488372093023256, "percentage": 82.95, "elapsed_time": "1:21:34", "remaining_time": "0:16:46"} |
|
{"current_steps": 215, "total_steps": 258, "loss": 0.017, "lr": 1.7231100184310956e-05, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "1:21:51", "remaining_time": "0:16:22"} |
|
{"current_steps": 216, "total_steps": 258, "loss": 0.0167, "lr": 1.6478788965611993e-05, "epoch": 2.511627906976744, "percentage": 83.72, "elapsed_time": "1:22:06", "remaining_time": "0:15:58"} |
|
{"current_steps": 217, "total_steps": 258, "loss": 0.0208, "lr": 1.5741792638335095e-05, "epoch": 2.5232558139534884, "percentage": 84.11, "elapsed_time": "1:22:22", "remaining_time": "0:15:33"} |
|
{"current_steps": 218, "total_steps": 258, "loss": 0.0191, "lr": 1.502024634202851e-05, "epoch": 2.5348837209302326, "percentage": 84.5, "elapsed_time": "1:22:39", "remaining_time": "0:15:09"} |
|
{"current_steps": 219, "total_steps": 258, "loss": 0.0175, "lr": 1.4314282383241096e-05, "epoch": 2.546511627906977, "percentage": 84.88, "elapsed_time": "1:22:54", "remaining_time": "0:14:45"} |
|
{"current_steps": 220, "total_steps": 258, "loss": 0.0176, "lr": 1.3624030211261685e-05, "epoch": 2.558139534883721, "percentage": 85.27, "elapsed_time": "1:23:10", "remaining_time": "0:14:22"} |
|
{"current_steps": 220, "total_steps": 258, "eval_loss": 0.02466263249516487, "epoch": 2.558139534883721, "percentage": 85.27, "elapsed_time": "1:24:19", "remaining_time": "0:14:33"} |
|
{"current_steps": 221, "total_steps": 258, "loss": 0.0184, "lr": 1.2949616394382802e-05, "epoch": 2.5697674418604652, "percentage": 85.66, "elapsed_time": "1:24:36", "remaining_time": "0:14:09"} |
|
{"current_steps": 222, "total_steps": 258, "loss": 0.0151, "lr": 1.2291164596692305e-05, "epoch": 2.5813953488372094, "percentage": 86.05, "elapsed_time": "1:24:51", "remaining_time": "0:13:45"} |
|
{"current_steps": 223, "total_steps": 258, "loss": 0.0209, "lr": 1.1648795555397719e-05, "epoch": 2.5930232558139537, "percentage": 86.43, "elapsed_time": "1:25:07", "remaining_time": "0:13:21"} |
|
{"current_steps": 224, "total_steps": 258, "loss": 0.0151, "lr": 1.1022627058687163e-05, "epoch": 2.604651162790698, "percentage": 86.82, "elapsed_time": "1:25:23", "remaining_time": "0:12:57"} |
|
{"current_steps": 225, "total_steps": 258, "loss": 0.0167, "lr": 1.0412773924131203e-05, "epoch": 2.616279069767442, "percentage": 87.21, "elapsed_time": "1:25:39", "remaining_time": "0:12:33"} |
|
{"current_steps": 226, "total_steps": 258, "loss": 0.0155, "lr": 9.819347977629202e-06, "epoch": 2.6279069767441863, "percentage": 87.6, "elapsed_time": "1:25:54", "remaining_time": "0:12:09"} |
|
{"current_steps": 227, "total_steps": 258, "loss": 0.0186, "lr": 9.242458032904311e-06, "epoch": 2.6395348837209305, "percentage": 87.98, "elapsed_time": "1:26:12", "remaining_time": "0:11:46"} |
|
{"current_steps": 228, "total_steps": 258, "loss": 0.0156, "lr": 8.682209871550884e-06, "epoch": 2.6511627906976747, "percentage": 88.37, "elapsed_time": "1:26:28", "remaining_time": "0:11:22"} |
|
{"current_steps": 229, "total_steps": 258, "loss": 0.0186, "lr": 8.138706223637827e-06, "epoch": 2.6627906976744184, "percentage": 88.76, "elapsed_time": "1:26:45", "remaining_time": "0:10:59"} |
|
{"current_steps": 230, "total_steps": 258, "loss": 0.016, "lr": 7.612046748871327e-06, "epoch": 2.6744186046511627, "percentage": 89.15, "elapsed_time": "1:27:01", "remaining_time": "0:10:35"} |
|
{"current_steps": 230, "total_steps": 258, "eval_loss": 0.02474929206073284, "epoch": 2.6744186046511627, "percentage": 89.15, "elapsed_time": "1:28:10", "remaining_time": "0:10:44"} |
|
{"current_steps": 231, "total_steps": 258, "loss": 0.0182, "lr": 7.102328018320858e-06, "epoch": 2.686046511627907, "percentage": 89.53, "elapsed_time": "1:28:27", "remaining_time": "0:10:20"} |
|
{"current_steps": 232, "total_steps": 258, "loss": 0.0172, "lr": 6.609643496711349e-06, "epoch": 2.697674418604651, "percentage": 89.92, "elapsed_time": "1:28:42", "remaining_time": "0:09:56"} |
|
{"current_steps": 233, "total_steps": 258, "loss": 0.0184, "lr": 6.13408352528495e-06, "epoch": 2.7093023255813953, "percentage": 90.31, "elapsed_time": "1:28:58", "remaining_time": "0:09:32"} |
|
{"current_steps": 234, "total_steps": 258, "loss": 0.0161, "lr": 5.6757353052356964e-06, "epoch": 2.7209302325581395, "percentage": 90.7, "elapsed_time": "1:29:14", "remaining_time": "0:09:09"} |
|
{"current_steps": 235, "total_steps": 258, "loss": 0.0172, "lr": 5.2346828817197655e-06, "epoch": 2.7325581395348837, "percentage": 91.09, "elapsed_time": "1:29:29", "remaining_time": "0:08:45"} |
|
{"current_steps": 236, "total_steps": 258, "loss": 0.0189, "lr": 4.811007128444445e-06, "epoch": 2.744186046511628, "percentage": 91.47, "elapsed_time": "1:29:47", "remaining_time": "0:08:22"} |
|
{"current_steps": 237, "total_steps": 258, "loss": 0.0141, "lr": 4.404785732838846e-06, "epoch": 2.755813953488372, "percentage": 91.86, "elapsed_time": "1:30:04", "remaining_time": "0:07:58"} |
|
{"current_steps": 238, "total_steps": 258, "loss": 0.0188, "lr": 4.016093181808623e-06, "epoch": 2.7674418604651163, "percentage": 92.25, "elapsed_time": "1:30:19", "remaining_time": "0:07:35"} |
|
{"current_steps": 239, "total_steps": 258, "loss": 0.0187, "lr": 3.6450007480777093e-06, "epoch": 2.7790697674418605, "percentage": 92.64, "elapsed_time": "1:30:35", "remaining_time": "0:07:12"} |
|
{"current_steps": 240, "total_steps": 258, "loss": 0.0202, "lr": 3.2915764771193292e-06, "epoch": 2.7906976744186047, "percentage": 93.02, "elapsed_time": "1:30:52", "remaining_time": "0:06:48"} |
|
{"current_steps": 240, "total_steps": 258, "eval_loss": 0.02471795864403248, "epoch": 2.7906976744186047, "percentage": 93.02, "elapsed_time": "1:32:00", "remaining_time": "0:06:54"} |
|
{"current_steps": 241, "total_steps": 258, "loss": 0.0175, "lr": 2.9558851746788517e-06, "epoch": 2.802325581395349, "percentage": 93.41, "elapsed_time": "1:32:16", "remaining_time": "0:06:30"} |
|
{"current_steps": 242, "total_steps": 258, "loss": 0.0205, "lr": 2.6379883948907e-06, "epoch": 2.813953488372093, "percentage": 93.8, "elapsed_time": "1:32:32", "remaining_time": "0:06:07"} |
|
{"current_steps": 243, "total_steps": 258, "loss": 0.0187, "lr": 2.3379444289913342e-06, "epoch": 2.8255813953488373, "percentage": 94.19, "elapsed_time": "1:32:49", "remaining_time": "0:05:43"} |
|
{"current_steps": 244, "total_steps": 258, "loss": 0.0146, "lr": 2.0558082946308232e-06, "epoch": 2.8372093023255816, "percentage": 94.57, "elapsed_time": "1:33:05", "remaining_time": "0:05:20"} |
|
{"current_steps": 245, "total_steps": 258, "loss": 0.0204, "lr": 1.7916317257844039e-06, "epoch": 2.8488372093023253, "percentage": 94.96, "elapsed_time": "1:33:22", "remaining_time": "0:04:57"} |
|
{"current_steps": 246, "total_steps": 258, "loss": 0.0169, "lr": 1.545463163266303e-06, "epoch": 2.8604651162790695, "percentage": 95.35, "elapsed_time": "1:33:38", "remaining_time": "0:04:34"} |
|
{"current_steps": 247, "total_steps": 258, "loss": 0.0146, "lr": 1.317347745847386e-06, "epoch": 2.8720930232558137, "percentage": 95.74, "elapsed_time": "1:33:54", "remaining_time": "0:04:10"} |
|
{"current_steps": 248, "total_steps": 258, "loss": 0.025, "lr": 1.107327301978245e-06, "epoch": 2.883720930232558, "percentage": 96.12, "elapsed_time": "1:34:10", "remaining_time": "0:03:47"} |
|
{"current_steps": 249, "total_steps": 258, "loss": 0.0175, "lr": 9.154403421193225e-07, "epoch": 2.895348837209302, "percentage": 96.51, "elapsed_time": "1:34:26", "remaining_time": "0:03:24"} |
|
{"current_steps": 250, "total_steps": 258, "loss": 0.0144, "lr": 7.417220516794499e-07, "epoch": 2.9069767441860463, "percentage": 96.9, "elapsed_time": "1:34:41", "remaining_time": "0:03:01"} |
|
{"current_steps": 250, "total_steps": 258, "eval_loss": 0.02471948228776455, "epoch": 2.9069767441860463, "percentage": 96.9, "elapsed_time": "1:35:50", "remaining_time": "0:03:04"} |
|
{"current_steps": 251, "total_steps": 258, "loss": 0.0186, "lr": 5.862042845640403e-07, "epoch": 2.9186046511627906, "percentage": 97.29, "elapsed_time": "1:36:07", "remaining_time": "0:02:40"} |
|
{"current_steps": 252, "total_steps": 258, "loss": 0.0157, "lr": 4.489155573341841e-07, "epoch": 2.9302325581395348, "percentage": 97.67, "elapsed_time": "1:36:23", "remaining_time": "0:02:17"} |
|
{"current_steps": 253, "total_steps": 258, "loss": 0.0169, "lr": 3.298810439777311e-07, "epoch": 2.941860465116279, "percentage": 98.06, "elapsed_time": "1:36:39", "remaining_time": "0:01:54"} |
|
{"current_steps": 254, "total_steps": 258, "loss": 0.0191, "lr": 2.2912257129320547e-07, "epoch": 2.953488372093023, "percentage": 98.45, "elapsed_time": "1:36:56", "remaining_time": "0:01:31"} |
|
{"current_steps": 255, "total_steps": 258, "loss": 0.0203, "lr": 1.4665861488761813e-07, "epoch": 2.9651162790697674, "percentage": 98.84, "elapsed_time": "1:37:13", "remaining_time": "0:01:08"} |
|
{"current_steps": 256, "total_steps": 258, "loss": 0.0159, "lr": 8.250429578855467e-08, "epoch": 2.9767441860465116, "percentage": 99.22, "elapsed_time": "1:37:29", "remaining_time": "0:00:45"} |
|
{"current_steps": 257, "total_steps": 258, "loss": 0.0174, "lr": 3.667137767160433e-08, "epoch": 2.988372093023256, "percentage": 99.61, "elapsed_time": "1:37:45", "remaining_time": "0:00:22"} |
|
{"current_steps": 258, "total_steps": 258, "loss": 0.0185, "lr": 9.168264703285356e-09, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:38:00", "remaining_time": "0:00:00"} |
|
{"current_steps": 258, "total_steps": 258, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:38:02", "remaining_time": "0:00:00"} |
|
|