|
{"current_steps": 1, "total_steps": 522, "loss": 0.9918, "lr": 0.0, "epoch": 0.005747126436781609, "percentage": 0.19, "elapsed_time": "0:00:54", "remaining_time": "7:51:51"} |
|
{"current_steps": 2, "total_steps": 522, "loss": 0.9604, "lr": 3.7735849056603773e-06, "epoch": 0.011494252873563218, "percentage": 0.38, "elapsed_time": "0:01:42", "remaining_time": "7:22:36"} |
|
{"current_steps": 3, "total_steps": 522, "loss": 0.9868, "lr": 7.547169811320755e-06, "epoch": 0.017241379310344827, "percentage": 0.57, "elapsed_time": "0:02:28", "remaining_time": "7:08:49"} |
|
{"current_steps": 4, "total_steps": 522, "loss": 0.962, "lr": 1.1320754716981132e-05, "epoch": 0.022988505747126436, "percentage": 0.77, "elapsed_time": "0:03:15", "remaining_time": "7:01:40"} |
|
{"current_steps": 5, "total_steps": 522, "loss": 0.9684, "lr": 1.509433962264151e-05, "epoch": 0.028735632183908046, "percentage": 0.96, "elapsed_time": "0:04:05", "remaining_time": "7:03:13"} |
|
{"current_steps": 6, "total_steps": 522, "loss": 0.9442, "lr": 1.8867924528301888e-05, "epoch": 0.034482758620689655, "percentage": 1.15, "elapsed_time": "0:04:57", "remaining_time": "7:06:55"} |
|
{"current_steps": 7, "total_steps": 522, "loss": 0.9382, "lr": 2.2641509433962265e-05, "epoch": 0.040229885057471264, "percentage": 1.34, "elapsed_time": "0:05:52", "remaining_time": "7:12:21"} |
|
{"current_steps": 8, "total_steps": 522, "loss": 0.9416, "lr": 2.641509433962264e-05, "epoch": 0.04597701149425287, "percentage": 1.53, "elapsed_time": "0:06:44", "remaining_time": "7:12:37"} |
|
{"current_steps": 9, "total_steps": 522, "loss": 0.9356, "lr": 3.018867924528302e-05, "epoch": 0.05172413793103448, "percentage": 1.72, "elapsed_time": "0:07:35", "remaining_time": "7:12:51"} |
|
{"current_steps": 10, "total_steps": 522, "loss": 0.9293, "lr": 3.39622641509434e-05, "epoch": 0.05747126436781609, "percentage": 1.92, "elapsed_time": "0:08:26", "remaining_time": "7:12:06"} |
|
{"current_steps": 10, "total_steps": 522, "eval_loss": 1.0470749139785767, "epoch": 0.05747126436781609, "percentage": 1.92, "elapsed_time": "0:15:18", "remaining_time": "13:03:53"} |
|
{"current_steps": 11, "total_steps": 522, "loss": 0.9533, "lr": 3.7735849056603776e-05, "epoch": 0.06321839080459771, "percentage": 2.11, "elapsed_time": "0:16:05", "remaining_time": "12:27:10"} |
|
{"current_steps": 12, "total_steps": 522, "loss": 0.9206, "lr": 4.150943396226415e-05, "epoch": 0.06896551724137931, "percentage": 2.3, "elapsed_time": "0:16:56", "remaining_time": "11:59:47"} |
|
{"current_steps": 13, "total_steps": 522, "loss": 0.8921, "lr": 4.528301886792453e-05, "epoch": 0.07471264367816093, "percentage": 2.49, "elapsed_time": "0:17:49", "remaining_time": "11:37:52"} |
|
{"current_steps": 14, "total_steps": 522, "loss": 0.8861, "lr": 4.9056603773584906e-05, "epoch": 0.08045977011494253, "percentage": 2.68, "elapsed_time": "0:18:45", "remaining_time": "11:20:34"} |
|
{"current_steps": 15, "total_steps": 522, "loss": 0.8904, "lr": 5.283018867924528e-05, "epoch": 0.08620689655172414, "percentage": 2.87, "elapsed_time": "0:19:31", "remaining_time": "11:00:03"} |
|
{"current_steps": 16, "total_steps": 522, "loss": 0.8424, "lr": 5.660377358490566e-05, "epoch": 0.09195402298850575, "percentage": 3.07, "elapsed_time": "0:20:21", "remaining_time": "10:43:35"} |
|
{"current_steps": 17, "total_steps": 522, "loss": 0.8395, "lr": 6.037735849056604e-05, "epoch": 0.09770114942528736, "percentage": 3.26, "elapsed_time": "0:21:07", "remaining_time": "10:27:21"} |
|
{"current_steps": 18, "total_steps": 522, "loss": 0.8203, "lr": 6.415094339622641e-05, "epoch": 0.10344827586206896, "percentage": 3.45, "elapsed_time": "0:21:55", "remaining_time": "10:13:55"} |
|
{"current_steps": 19, "total_steps": 522, "loss": 0.8464, "lr": 6.79245283018868e-05, "epoch": 0.10919540229885058, "percentage": 3.64, "elapsed_time": "0:22:46", "remaining_time": "10:02:48"} |
|
{"current_steps": 20, "total_steps": 522, "loss": 0.8085, "lr": 7.169811320754717e-05, "epoch": 0.11494252873563218, "percentage": 3.83, "elapsed_time": "0:23:32", "remaining_time": "9:50:53"} |
|
{"current_steps": 20, "total_steps": 522, "eval_loss": 0.8244547247886658, "epoch": 0.11494252873563218, "percentage": 3.83, "elapsed_time": "0:30:16", "remaining_time": "12:40:05"} |
|
{"current_steps": 21, "total_steps": 522, "loss": 0.8219, "lr": 7.547169811320755e-05, "epoch": 0.1206896551724138, "percentage": 4.02, "elapsed_time": "0:31:03", "remaining_time": "12:20:49"} |
|
{"current_steps": 22, "total_steps": 522, "loss": 0.8148, "lr": 7.924528301886794e-05, "epoch": 0.12643678160919541, "percentage": 4.21, "elapsed_time": "0:31:50", "remaining_time": "12:03:40"} |
|
{"current_steps": 23, "total_steps": 522, "loss": 0.7846, "lr": 8.30188679245283e-05, "epoch": 0.13218390804597702, "percentage": 4.41, "elapsed_time": "0:32:37", "remaining_time": "11:47:41"} |
|
{"current_steps": 24, "total_steps": 522, "loss": 0.7903, "lr": 8.679245283018869e-05, "epoch": 0.13793103448275862, "percentage": 4.6, "elapsed_time": "0:33:26", "remaining_time": "11:34:04"} |
|
{"current_steps": 25, "total_steps": 522, "loss": 0.7741, "lr": 9.056603773584906e-05, "epoch": 0.14367816091954022, "percentage": 4.79, "elapsed_time": "0:34:13", "remaining_time": "11:20:16"} |
|
{"current_steps": 26, "total_steps": 522, "loss": 0.7308, "lr": 9.433962264150944e-05, "epoch": 0.14942528735632185, "percentage": 4.98, "elapsed_time": "0:34:57", "remaining_time": "11:06:58"} |
|
{"current_steps": 27, "total_steps": 522, "loss": 0.7559, "lr": 9.811320754716981e-05, "epoch": 0.15517241379310345, "percentage": 5.17, "elapsed_time": "0:35:54", "remaining_time": "10:58:25"} |
|
{"current_steps": 28, "total_steps": 522, "loss": 0.7622, "lr": 0.0001018867924528302, "epoch": 0.16091954022988506, "percentage": 5.36, "elapsed_time": "0:36:45", "remaining_time": "10:48:27"} |
|
{"current_steps": 29, "total_steps": 522, "loss": 0.7436, "lr": 0.00010566037735849057, "epoch": 0.16666666666666666, "percentage": 5.56, "elapsed_time": "0:37:31", "remaining_time": "10:37:49"} |
|
{"current_steps": 30, "total_steps": 522, "loss": 0.7547, "lr": 0.00010943396226415095, "epoch": 0.1724137931034483, "percentage": 5.75, "elapsed_time": "0:38:19", "remaining_time": "10:28:35"} |
|
{"current_steps": 30, "total_steps": 522, "eval_loss": 0.7580565214157104, "epoch": 0.1724137931034483, "percentage": 5.75, "elapsed_time": "0:45:04", "remaining_time": "12:19:12"} |
|
{"current_steps": 31, "total_steps": 522, "loss": 0.7337, "lr": 0.00011320754716981132, "epoch": 0.1781609195402299, "percentage": 5.94, "elapsed_time": "0:45:55", "remaining_time": "12:07:23"} |
|
{"current_steps": 32, "total_steps": 522, "loss": 0.7538, "lr": 0.0001169811320754717, "epoch": 0.1839080459770115, "percentage": 6.13, "elapsed_time": "0:46:42", "remaining_time": "11:55:11"} |
|
{"current_steps": 33, "total_steps": 522, "loss": 0.7186, "lr": 0.00012075471698113207, "epoch": 0.1896551724137931, "percentage": 6.32, "elapsed_time": "0:47:30", "remaining_time": "11:43:55"} |
|
{"current_steps": 34, "total_steps": 522, "loss": 0.7719, "lr": 0.00012452830188679244, "epoch": 0.19540229885057472, "percentage": 6.51, "elapsed_time": "0:48:19", "remaining_time": "11:33:32"} |
|
{"current_steps": 35, "total_steps": 522, "loss": 0.752, "lr": 0.00012830188679245283, "epoch": 0.20114942528735633, "percentage": 6.7, "elapsed_time": "0:49:10", "remaining_time": "11:24:11"} |
|
{"current_steps": 36, "total_steps": 522, "loss": 0.7429, "lr": 0.0001320754716981132, "epoch": 0.20689655172413793, "percentage": 6.9, "elapsed_time": "0:49:59", "remaining_time": "11:14:51"} |
|
{"current_steps": 37, "total_steps": 522, "loss": 0.7208, "lr": 0.0001358490566037736, "epoch": 0.21264367816091953, "percentage": 7.09, "elapsed_time": "0:50:47", "remaining_time": "11:05:48"} |
|
{"current_steps": 38, "total_steps": 522, "loss": 0.7651, "lr": 0.00013962264150943395, "epoch": 0.21839080459770116, "percentage": 7.28, "elapsed_time": "0:51:36", "remaining_time": "10:57:18"} |
|
{"current_steps": 39, "total_steps": 522, "loss": 0.7456, "lr": 0.00014339622641509434, "epoch": 0.22413793103448276, "percentage": 7.47, "elapsed_time": "0:52:23", "remaining_time": "10:48:56"} |
|
{"current_steps": 40, "total_steps": 522, "loss": 0.7289, "lr": 0.00014716981132075472, "epoch": 0.22988505747126436, "percentage": 7.66, "elapsed_time": "0:53:14", "remaining_time": "10:41:34"} |
|
{"current_steps": 40, "total_steps": 522, "eval_loss": 0.7386028170585632, "epoch": 0.22988505747126436, "percentage": 7.66, "elapsed_time": "1:00:02", "remaining_time": "12:03:24"} |
|
{"current_steps": 41, "total_steps": 522, "loss": 0.7503, "lr": 0.0001509433962264151, "epoch": 0.23563218390804597, "percentage": 7.85, "elapsed_time": "1:00:54", "remaining_time": "11:54:38"} |
|
{"current_steps": 42, "total_steps": 522, "loss": 0.7392, "lr": 0.0001547169811320755, "epoch": 0.2413793103448276, "percentage": 8.05, "elapsed_time": "1:01:46", "remaining_time": "11:46:01"} |
|
{"current_steps": 43, "total_steps": 522, "loss": 0.7206, "lr": 0.00015849056603773587, "epoch": 0.2471264367816092, "percentage": 8.24, "elapsed_time": "1:02:31", "remaining_time": "11:36:24"} |
|
{"current_steps": 44, "total_steps": 522, "loss": 0.7198, "lr": 0.00016226415094339625, "epoch": 0.25287356321839083, "percentage": 8.43, "elapsed_time": "1:03:17", "remaining_time": "11:27:39"} |
|
{"current_steps": 45, "total_steps": 522, "loss": 0.7393, "lr": 0.0001660377358490566, "epoch": 0.25862068965517243, "percentage": 8.62, "elapsed_time": "1:04:08", "remaining_time": "11:19:55"} |
|
{"current_steps": 46, "total_steps": 522, "loss": 0.7576, "lr": 0.000169811320754717, "epoch": 0.26436781609195403, "percentage": 8.81, "elapsed_time": "1:05:00", "remaining_time": "11:12:42"} |
|
{"current_steps": 47, "total_steps": 522, "loss": 0.7157, "lr": 0.00017358490566037738, "epoch": 0.27011494252873564, "percentage": 9.0, "elapsed_time": "1:05:43", "remaining_time": "11:04:16"} |
|
{"current_steps": 48, "total_steps": 522, "loss": 0.7256, "lr": 0.00017735849056603776, "epoch": 0.27586206896551724, "percentage": 9.2, "elapsed_time": "1:06:36", "remaining_time": "10:57:49"} |
|
{"current_steps": 49, "total_steps": 522, "loss": 0.7295, "lr": 0.00018113207547169812, "epoch": 0.28160919540229884, "percentage": 9.39, "elapsed_time": "1:07:32", "remaining_time": "10:51:55"} |
|
{"current_steps": 50, "total_steps": 522, "loss": 0.6965, "lr": 0.0001849056603773585, "epoch": 0.28735632183908044, "percentage": 9.58, "elapsed_time": "1:08:20", "remaining_time": "10:45:08"} |
|
{"current_steps": 50, "total_steps": 522, "eval_loss": 0.724204421043396, "epoch": 0.28735632183908044, "percentage": 9.58, "elapsed_time": "1:15:05", "remaining_time": "11:48:52"} |
|
{"current_steps": 51, "total_steps": 522, "loss": 0.7273, "lr": 0.00018867924528301889, "epoch": 0.29310344827586204, "percentage": 9.77, "elapsed_time": "1:15:57", "remaining_time": "11:41:32"} |
|
{"current_steps": 52, "total_steps": 522, "loss": 0.7084, "lr": 0.00019245283018867927, "epoch": 0.2988505747126437, "percentage": 9.96, "elapsed_time": "1:16:47", "remaining_time": "11:34:06"} |
|
{"current_steps": 53, "total_steps": 522, "loss": 0.7485, "lr": 0.00019622641509433963, "epoch": 0.3045977011494253, "percentage": 10.15, "elapsed_time": "1:17:40", "remaining_time": "11:27:17"} |
|
{"current_steps": 54, "total_steps": 522, "loss": 0.745, "lr": 0.0002, "epoch": 0.3103448275862069, "percentage": 10.34, "elapsed_time": "1:18:27", "remaining_time": "11:19:56"} |
|
{"current_steps": 55, "total_steps": 522, "loss": 0.7165, "lr": 0.00019999775651876987, "epoch": 0.3160919540229885, "percentage": 10.54, "elapsed_time": "1:19:15", "remaining_time": "11:12:57"} |
|
{"current_steps": 56, "total_steps": 522, "loss": 0.7499, "lr": 0.00019999102617574365, "epoch": 0.3218390804597701, "percentage": 10.73, "elapsed_time": "1:20:01", "remaining_time": "11:05:52"} |
|
{"current_steps": 57, "total_steps": 522, "loss": 0.7118, "lr": 0.00019997980927290927, "epoch": 0.3275862068965517, "percentage": 10.92, "elapsed_time": "1:20:57", "remaining_time": "11:00:30"} |
|
{"current_steps": 58, "total_steps": 522, "loss": 0.6945, "lr": 0.00019996410631356498, "epoch": 0.3333333333333333, "percentage": 11.11, "elapsed_time": "1:21:43", "remaining_time": "10:53:51"} |
|
{"current_steps": 59, "total_steps": 522, "loss": 0.6982, "lr": 0.00019994391800229666, "epoch": 0.3390804597701149, "percentage": 11.3, "elapsed_time": "1:22:35", "remaining_time": "10:48:05"} |
|
{"current_steps": 60, "total_steps": 522, "loss": 0.6848, "lr": 0.00019991924524494627, "epoch": 0.3448275862068966, "percentage": 11.49, "elapsed_time": "1:23:21", "remaining_time": "10:41:55"} |
|
{"current_steps": 60, "total_steps": 522, "eval_loss": 0.7109408378601074, "epoch": 0.3448275862068966, "percentage": 11.49, "elapsed_time": "1:30:06", "remaining_time": "11:33:53"} |
|
{"current_steps": 61, "total_steps": 522, "loss": 0.6899, "lr": 0.00019989008914857116, "epoch": 0.3505747126436782, "percentage": 11.69, "elapsed_time": "1:30:51", "remaining_time": "11:26:41"} |
|
{"current_steps": 62, "total_steps": 522, "loss": 0.7094, "lr": 0.0001998564510213944, "epoch": 0.3563218390804598, "percentage": 11.88, "elapsed_time": "1:31:38", "remaining_time": "11:19:57"} |
|
{"current_steps": 63, "total_steps": 522, "loss": 0.6975, "lr": 0.00019981833237274618, "epoch": 0.3620689655172414, "percentage": 12.07, "elapsed_time": "1:32:25", "remaining_time": "11:13:20"} |
|
{"current_steps": 64, "total_steps": 522, "loss": 0.714, "lr": 0.00019977573491299598, "epoch": 0.367816091954023, "percentage": 12.26, "elapsed_time": "1:33:19", "remaining_time": "11:07:49"} |
|
{"current_steps": 65, "total_steps": 522, "loss": 0.7339, "lr": 0.00019972866055347572, "epoch": 0.3735632183908046, "percentage": 12.45, "elapsed_time": "1:34:09", "remaining_time": "11:01:59"} |
|
{"current_steps": 66, "total_steps": 522, "loss": 0.6821, "lr": 0.0001996771114063943, "epoch": 0.3793103448275862, "percentage": 12.64, "elapsed_time": "1:34:57", "remaining_time": "10:56:01"} |
|
{"current_steps": 67, "total_steps": 522, "loss": 0.7273, "lr": 0.00019962108978474263, "epoch": 0.3850574712643678, "percentage": 12.84, "elapsed_time": "1:35:45", "remaining_time": "10:50:15"} |
|
{"current_steps": 68, "total_steps": 522, "loss": 0.6984, "lr": 0.00019956059820218982, "epoch": 0.39080459770114945, "percentage": 13.03, "elapsed_time": "1:36:37", "remaining_time": "10:45:06"} |
|
{"current_steps": 69, "total_steps": 522, "loss": 0.6778, "lr": 0.00019949563937297045, "epoch": 0.39655172413793105, "percentage": 13.22, "elapsed_time": "1:37:21", "remaining_time": "10:39:08"} |
|
{"current_steps": 70, "total_steps": 522, "loss": 0.693, "lr": 0.00019942621621176282, "epoch": 0.40229885057471265, "percentage": 13.41, "elapsed_time": "1:38:09", "remaining_time": "10:33:46"} |
|
{"current_steps": 70, "total_steps": 522, "eval_loss": 0.7021871209144592, "epoch": 0.40229885057471265, "percentage": 13.41, "elapsed_time": "1:44:55", "remaining_time": "11:17:32"} |
|
{"current_steps": 71, "total_steps": 522, "loss": 0.6967, "lr": 0.0001993523318335581, "epoch": 0.40804597701149425, "percentage": 13.6, "elapsed_time": "1:45:46", "remaining_time": "11:11:52"} |
|
{"current_steps": 72, "total_steps": 522, "loss": 0.7279, "lr": 0.00019927398955352061, "epoch": 0.41379310344827586, "percentage": 13.79, "elapsed_time": "1:46:36", "remaining_time": "11:06:20"} |
|
{"current_steps": 73, "total_steps": 522, "loss": 0.6792, "lr": 0.00019919119288683908, "epoch": 0.41954022988505746, "percentage": 13.98, "elapsed_time": "1:47:25", "remaining_time": "11:00:42"} |
|
{"current_steps": 74, "total_steps": 522, "loss": 0.701, "lr": 0.00019910394554856876, "epoch": 0.42528735632183906, "percentage": 14.18, "elapsed_time": "1:48:14", "remaining_time": "10:55:18"} |
|
{"current_steps": 75, "total_steps": 522, "loss": 0.6805, "lr": 0.0001990122514534651, "epoch": 0.43103448275862066, "percentage": 14.37, "elapsed_time": "1:49:06", "remaining_time": "10:50:14"} |
|
{"current_steps": 76, "total_steps": 522, "loss": 0.7058, "lr": 0.00019891611471580764, "epoch": 0.4367816091954023, "percentage": 14.56, "elapsed_time": "1:49:58", "remaining_time": "10:45:22"} |
|
{"current_steps": 77, "total_steps": 522, "loss": 0.6861, "lr": 0.00019881553964921572, "epoch": 0.4425287356321839, "percentage": 14.75, "elapsed_time": "1:50:50", "remaining_time": "10:40:35"} |
|
{"current_steps": 78, "total_steps": 522, "loss": 0.6969, "lr": 0.00019871053076645488, "epoch": 0.4482758620689655, "percentage": 14.94, "elapsed_time": "1:51:38", "remaining_time": "10:35:31"} |
|
{"current_steps": 79, "total_steps": 522, "loss": 0.7001, "lr": 0.00019860109277923418, "epoch": 0.4540229885057471, "percentage": 15.13, "elapsed_time": "1:52:32", "remaining_time": "10:31:05"} |
|
{"current_steps": 80, "total_steps": 522, "loss": 0.7101, "lr": 0.00019848723059799506, "epoch": 0.45977011494252873, "percentage": 15.33, "elapsed_time": "1:53:24", "remaining_time": "10:26:37"} |
|
{"current_steps": 80, "total_steps": 522, "eval_loss": 0.694656252861023, "epoch": 0.45977011494252873, "percentage": 15.33, "elapsed_time": "2:00:15", "remaining_time": "11:04:27"} |
|
{"current_steps": 81, "total_steps": 522, "loss": 0.6836, "lr": 0.00019836894933169088, "epoch": 0.46551724137931033, "percentage": 15.52, "elapsed_time": "2:01:09", "remaining_time": "10:59:38"} |
|
{"current_steps": 82, "total_steps": 522, "loss": 0.7181, "lr": 0.0001982462542875576, "epoch": 0.47126436781609193, "percentage": 15.71, "elapsed_time": "2:01:59", "remaining_time": "10:54:34"} |
|
{"current_steps": 83, "total_steps": 522, "loss": 0.6645, "lr": 0.00019811915097087587, "epoch": 0.47701149425287354, "percentage": 15.9, "elapsed_time": "2:02:56", "remaining_time": "10:50:16"} |
|
{"current_steps": 84, "total_steps": 522, "loss": 0.6891, "lr": 0.00019798764508472373, "epoch": 0.4827586206896552, "percentage": 16.09, "elapsed_time": "2:03:46", "remaining_time": "10:45:24"} |
|
{"current_steps": 85, "total_steps": 522, "loss": 0.6842, "lr": 0.00019785174252972092, "epoch": 0.4885057471264368, "percentage": 16.28, "elapsed_time": "2:04:32", "remaining_time": "10:40:16"} |
|
{"current_steps": 86, "total_steps": 522, "loss": 0.7047, "lr": 0.0001977114494037641, "epoch": 0.4942528735632184, "percentage": 16.48, "elapsed_time": "2:05:27", "remaining_time": "10:36:03"} |
|
{"current_steps": 87, "total_steps": 522, "loss": 0.7261, "lr": 0.00019756677200175315, "epoch": 0.5, "percentage": 16.67, "elapsed_time": "2:06:16", "remaining_time": "10:31:23"} |
|
{"current_steps": 88, "total_steps": 522, "loss": 0.6699, "lr": 0.0001974177168153088, "epoch": 0.5057471264367817, "percentage": 16.86, "elapsed_time": "2:07:07", "remaining_time": "10:26:57"} |
|
{"current_steps": 89, "total_steps": 522, "loss": 0.6831, "lr": 0.0001972642905324813, "epoch": 0.5114942528735632, "percentage": 17.05, "elapsed_time": "2:08:02", "remaining_time": "10:22:58"} |
|
{"current_steps": 90, "total_steps": 522, "loss": 0.7293, "lr": 0.0001971065000374504, "epoch": 0.5172413793103449, "percentage": 17.24, "elapsed_time": "2:08:53", "remaining_time": "10:18:38"} |
|
{"current_steps": 90, "total_steps": 522, "eval_loss": 0.6888386607170105, "epoch": 0.5172413793103449, "percentage": 17.24, "elapsed_time": "2:15:38", "remaining_time": "10:51:04"} |
|
{"current_steps": 91, "total_steps": 522, "loss": 0.6945, "lr": 0.0001969443524102163, "epoch": 0.5229885057471264, "percentage": 17.43, "elapsed_time": "2:16:28", "remaining_time": "10:46:20"} |
|
{"current_steps": 92, "total_steps": 522, "loss": 0.6985, "lr": 0.0001967778549262822, "epoch": 0.5287356321839081, "percentage": 17.62, "elapsed_time": "2:17:14", "remaining_time": "10:41:27"} |
|
{"current_steps": 93, "total_steps": 522, "loss": 0.6911, "lr": 0.00019660701505632772, "epoch": 0.5344827586206896, "percentage": 17.82, "elapsed_time": "2:18:08", "remaining_time": "10:37:13"} |
|
{"current_steps": 94, "total_steps": 522, "loss": 0.6815, "lr": 0.0001964318404658737, "epoch": 0.5402298850574713, "percentage": 18.01, "elapsed_time": "2:19:01", "remaining_time": "10:32:58"} |
|
{"current_steps": 95, "total_steps": 522, "loss": 0.6664, "lr": 0.00019625233901493822, "epoch": 0.5459770114942529, "percentage": 18.2, "elapsed_time": "2:19:46", "remaining_time": "10:28:15"} |
|
{"current_steps": 96, "total_steps": 522, "loss": 0.6689, "lr": 0.000196068518757684, "epoch": 0.5517241379310345, "percentage": 18.39, "elapsed_time": "2:20:34", "remaining_time": "10:23:46"} |
|
{"current_steps": 97, "total_steps": 522, "loss": 0.6695, "lr": 0.00019588038794205703, "epoch": 0.5574712643678161, "percentage": 18.58, "elapsed_time": "2:21:24", "remaining_time": "10:19:35"} |
|
{"current_steps": 98, "total_steps": 522, "loss": 0.7062, "lr": 0.00019568795500941635, "epoch": 0.5632183908045977, "percentage": 18.77, "elapsed_time": "2:22:16", "remaining_time": "10:15:32"} |
|
{"current_steps": 99, "total_steps": 522, "loss": 0.6891, "lr": 0.00019549122859415538, "epoch": 0.5689655172413793, "percentage": 18.97, "elapsed_time": "2:23:04", "remaining_time": "10:11:20"} |
|
{"current_steps": 100, "total_steps": 522, "loss": 0.6852, "lr": 0.00019529021752331453, "epoch": 0.5747126436781609, "percentage": 19.16, "elapsed_time": "2:23:58", "remaining_time": "10:07:33"} |
|
{"current_steps": 100, "total_steps": 522, "eval_loss": 0.6821601986885071, "epoch": 0.5747126436781609, "percentage": 19.16, "elapsed_time": "2:30:42", "remaining_time": "10:35:59"} |
|
{"current_steps": 101, "total_steps": 522, "loss": 0.6785, "lr": 0.00019508493081618513, "epoch": 0.5804597701149425, "percentage": 19.35, "elapsed_time": "2:31:32", "remaining_time": "10:31:39"} |
|
{"current_steps": 102, "total_steps": 522, "loss": 0.6724, "lr": 0.00019487537768390464, "epoch": 0.5862068965517241, "percentage": 19.54, "elapsed_time": "2:32:22", "remaining_time": "10:27:25"} |
|
{"current_steps": 103, "total_steps": 522, "loss": 0.7117, "lr": 0.00019466156752904343, "epoch": 0.5919540229885057, "percentage": 19.73, "elapsed_time": "2:33:12", "remaining_time": "10:23:14"} |
|
{"current_steps": 104, "total_steps": 522, "loss": 0.6982, "lr": 0.0001944435099451829, "epoch": 0.5977011494252874, "percentage": 19.92, "elapsed_time": "2:34:00", "remaining_time": "10:18:58"} |
|
{"current_steps": 105, "total_steps": 522, "loss": 0.6768, "lr": 0.00019422121471648497, "epoch": 0.603448275862069, "percentage": 20.11, "elapsed_time": "2:34:47", "remaining_time": "10:14:45"} |
|
{"current_steps": 106, "total_steps": 522, "loss": 0.7073, "lr": 0.0001939946918172531, "epoch": 0.6091954022988506, "percentage": 20.31, "elapsed_time": "2:35:39", "remaining_time": "10:10:53"} |
|
{"current_steps": 107, "total_steps": 522, "loss": 0.6831, "lr": 0.00019376395141148476, "epoch": 0.6149425287356322, "percentage": 20.5, "elapsed_time": "2:36:35", "remaining_time": "10:07:20"} |
|
{"current_steps": 108, "total_steps": 522, "loss": 0.6857, "lr": 0.00019352900385241536, "epoch": 0.6206896551724138, "percentage": 20.69, "elapsed_time": "2:37:27", "remaining_time": "10:03:34"} |
|
{"current_steps": 109, "total_steps": 522, "loss": 0.672, "lr": 0.0001932898596820536, "epoch": 0.6264367816091954, "percentage": 20.88, "elapsed_time": "2:38:17", "remaining_time": "9:59:44"} |
|
{"current_steps": 110, "total_steps": 522, "loss": 0.7033, "lr": 0.0001930465296307087, "epoch": 0.632183908045977, "percentage": 21.07, "elapsed_time": "2:39:04", "remaining_time": "9:55:50"} |
|
{"current_steps": 110, "total_steps": 522, "eval_loss": 0.677044153213501, "epoch": 0.632183908045977, "percentage": 21.07, "elapsed_time": "2:45:50", "remaining_time": "10:21:07"} |
|
{"current_steps": 111, "total_steps": 522, "loss": 0.6831, "lr": 0.00019279902461650866, "epoch": 0.6379310344827587, "percentage": 21.26, "elapsed_time": "2:46:41", "remaining_time": "10:17:13"} |
|
{"current_steps": 112, "total_steps": 522, "loss": 0.6654, "lr": 0.00019254735574491058, "epoch": 0.6436781609195402, "percentage": 21.46, "elapsed_time": "2:47:38", "remaining_time": "10:13:41"} |
|
{"current_steps": 113, "total_steps": 522, "loss": 0.6744, "lr": 0.00019229153430820232, "epoch": 0.6494252873563219, "percentage": 21.65, "elapsed_time": "2:48:27", "remaining_time": "10:09:45"} |
|
{"current_steps": 114, "total_steps": 522, "loss": 0.6833, "lr": 0.0001920315717849956, "epoch": 0.6551724137931034, "percentage": 21.84, "elapsed_time": "2:49:13", "remaining_time": "10:05:37"} |
|
{"current_steps": 115, "total_steps": 522, "loss": 0.677, "lr": 0.0001917674798397113, "epoch": 0.6609195402298851, "percentage": 22.03, "elapsed_time": "2:50:03", "remaining_time": "10:01:50"} |
|
{"current_steps": 116, "total_steps": 522, "loss": 0.6828, "lr": 0.00019149927032205587, "epoch": 0.6666666666666666, "percentage": 22.22, "elapsed_time": "2:50:49", "remaining_time": "9:57:54"} |
|
{"current_steps": 117, "total_steps": 522, "loss": 0.6858, "lr": 0.00019122695526648968, "epoch": 0.6724137931034483, "percentage": 22.41, "elapsed_time": "2:51:41", "remaining_time": "9:54:19"} |
|
{"current_steps": 118, "total_steps": 522, "loss": 0.6591, "lr": 0.00019095054689168705, "epoch": 0.6781609195402298, "percentage": 22.61, "elapsed_time": "2:52:37", "remaining_time": "9:51:00"} |
|
{"current_steps": 119, "total_steps": 522, "loss": 0.6669, "lr": 0.00019067005759998797, "epoch": 0.6839080459770115, "percentage": 22.8, "elapsed_time": "2:53:24", "remaining_time": "9:47:16"} |
|
{"current_steps": 120, "total_steps": 522, "loss": 0.6815, "lr": 0.0001903854999768417, "epoch": 0.6896551724137931, "percentage": 22.99, "elapsed_time": "2:54:17", "remaining_time": "9:43:53"} |
|
{"current_steps": 120, "total_steps": 522, "eval_loss": 0.6735538244247437, "epoch": 0.6896551724137931, "percentage": 22.99, "elapsed_time": "3:01:03", "remaining_time": "10:06:33"} |
|
{"current_steps": 121, "total_steps": 522, "loss": 0.67, "lr": 0.0001900968867902419, "epoch": 0.6954022988505747, "percentage": 23.18, "elapsed_time": "3:01:53", "remaining_time": "10:02:47"} |
|
{"current_steps": 122, "total_steps": 522, "loss": 0.6733, "lr": 0.00018980423099015402, "epoch": 0.7011494252873564, "percentage": 23.37, "elapsed_time": "3:02:42", "remaining_time": "9:59:01"} |
|
{"current_steps": 123, "total_steps": 522, "loss": 0.6702, "lr": 0.00018950754570793384, "epoch": 0.7068965517241379, "percentage": 23.56, "elapsed_time": "3:03:33", "remaining_time": "9:55:27"} |
|
{"current_steps": 124, "total_steps": 522, "loss": 0.6619, "lr": 0.00018920684425573865, "epoch": 0.7126436781609196, "percentage": 23.75, "elapsed_time": "3:04:22", "remaining_time": "9:51:45"} |
|
{"current_steps": 125, "total_steps": 522, "loss": 0.6851, "lr": 0.00018890214012592975, "epoch": 0.7183908045977011, "percentage": 23.95, "elapsed_time": "3:05:12", "remaining_time": "9:48:14"} |
|
{"current_steps": 126, "total_steps": 522, "loss": 0.6346, "lr": 0.000188593446990467, "epoch": 0.7241379310344828, "percentage": 24.14, "elapsed_time": "3:06:06", "remaining_time": "9:44:54"} |
|
{"current_steps": 127, "total_steps": 522, "loss": 0.6834, "lr": 0.00018828077870029552, "epoch": 0.7298850574712644, "percentage": 24.33, "elapsed_time": "3:06:55", "remaining_time": "9:41:23"} |
|
{"current_steps": 128, "total_steps": 522, "loss": 0.6279, "lr": 0.00018796414928472417, "epoch": 0.735632183908046, "percentage": 24.52, "elapsed_time": "3:07:42", "remaining_time": "9:37:46"} |
|
{"current_steps": 129, "total_steps": 522, "loss": 0.6348, "lr": 0.0001876435729507959, "epoch": 0.7413793103448276, "percentage": 24.71, "elapsed_time": "3:08:32", "remaining_time": "9:34:23"} |
|
{"current_steps": 130, "total_steps": 522, "loss": 0.679, "lr": 0.0001873190640826505, "epoch": 0.7471264367816092, "percentage": 24.9, "elapsed_time": "3:09:30", "remaining_time": "9:31:27"} |
|
{"current_steps": 130, "total_steps": 522, "eval_loss": 0.6707044243812561, "epoch": 0.7471264367816092, "percentage": 24.9, "elapsed_time": "3:16:18", "remaining_time": "9:51:56"} |
|
{"current_steps": 131, "total_steps": 522, "loss": 0.6423, "lr": 0.00018699063724087904, "epoch": 0.7528735632183908, "percentage": 25.1, "elapsed_time": "3:17:12", "remaining_time": "9:48:36"} |
|
{"current_steps": 132, "total_steps": 522, "loss": 0.6654, "lr": 0.00018665830716187065, "epoch": 0.7586206896551724, "percentage": 25.29, "elapsed_time": "3:18:00", "remaining_time": "9:45:02"} |
|
{"current_steps": 133, "total_steps": 522, "loss": 0.6866, "lr": 0.0001863220887571512, "epoch": 0.764367816091954, "percentage": 25.48, "elapsed_time": "3:18:56", "remaining_time": "9:41:50"} |
|
{"current_steps": 134, "total_steps": 522, "loss": 0.7014, "lr": 0.0001859819971127143, "epoch": 0.7701149425287356, "percentage": 25.67, "elapsed_time": "3:19:45", "remaining_time": "9:38:24"} |
|
{"current_steps": 135, "total_steps": 522, "loss": 0.6769, "lr": 0.00018563804748834438, "epoch": 0.7758620689655172, "percentage": 25.86, "elapsed_time": "3:20:38", "remaining_time": "9:35:11"} |
|
{"current_steps": 136, "total_steps": 522, "loss": 0.6821, "lr": 0.000185290255316932, "epoch": 0.7816091954022989, "percentage": 26.05, "elapsed_time": "3:21:36", "remaining_time": "9:32:11"} |
|
{"current_steps": 137, "total_steps": 522, "loss": 0.6614, "lr": 0.00018493863620378122, "epoch": 0.7873563218390804, "percentage": 26.25, "elapsed_time": "3:22:37", "remaining_time": "9:29:25"} |
|
{"current_steps": 138, "total_steps": 522, "loss": 0.6699, "lr": 0.00018458320592590975, "epoch": 0.7931034482758621, "percentage": 26.44, "elapsed_time": "3:23:26", "remaining_time": "9:26:07"} |
|
{"current_steps": 139, "total_steps": 522, "loss": 0.6795, "lr": 0.00018422398043134067, "epoch": 0.7988505747126436, "percentage": 26.63, "elapsed_time": "3:24:18", "remaining_time": "9:22:56"} |
|
{"current_steps": 140, "total_steps": 522, "loss": 0.6571, "lr": 0.00018386097583838714, "epoch": 0.8045977011494253, "percentage": 26.82, "elapsed_time": "3:25:05", "remaining_time": "9:19:36"} |
|
{"current_steps": 140, "total_steps": 522, "eval_loss": 0.6682229042053223, "epoch": 0.8045977011494253, "percentage": 26.82, "elapsed_time": "3:31:50", "remaining_time": "9:38:01"} |
|
{"current_steps": 141, "total_steps": 522, "loss": 0.6524, "lr": 0.00018349420843492888, "epoch": 0.8103448275862069, "percentage": 27.01, "elapsed_time": "3:32:45", "remaining_time": "9:34:54"} |
|
{"current_steps": 142, "total_steps": 522, "loss": 0.6685, "lr": 0.00018312369467768166, "epoch": 0.8160919540229885, "percentage": 27.2, "elapsed_time": "3:33:39", "remaining_time": "9:31:44"} |
|
{"current_steps": 143, "total_steps": 522, "loss": 0.659, "lr": 0.0001827494511914587, "epoch": 0.8218390804597702, "percentage": 27.39, "elapsed_time": "3:34:27", "remaining_time": "9:28:23"} |
|
{"current_steps": 144, "total_steps": 522, "loss": 0.6792, "lr": 0.0001823714947684247, "epoch": 0.8275862068965517, "percentage": 27.59, "elapsed_time": "3:35:12", "remaining_time": "9:24:56"} |
|
{"current_steps": 145, "total_steps": 522, "loss": 0.6954, "lr": 0.00018198984236734246, "epoch": 0.8333333333333334, "percentage": 27.78, "elapsed_time": "3:36:01", "remaining_time": "9:21:39"} |
|
{"current_steps": 146, "total_steps": 522, "loss": 0.6527, "lr": 0.000181604511112812, "epoch": 0.8390804597701149, "percentage": 27.97, "elapsed_time": "3:36:47", "remaining_time": "9:18:17"} |
|
{"current_steps": 147, "total_steps": 522, "loss": 0.6571, "lr": 0.000181215518294502, "epoch": 0.8448275862068966, "percentage": 28.16, "elapsed_time": "3:37:31", "remaining_time": "9:14:53"} |
|
{"current_steps": 148, "total_steps": 522, "loss": 0.6773, "lr": 0.00018082288136637422, "epoch": 0.8505747126436781, "percentage": 28.35, "elapsed_time": "3:38:23", "remaining_time": "9:11:52"} |
|
{"current_steps": 149, "total_steps": 522, "loss": 0.7066, "lr": 0.00018042661794590023, "epoch": 0.8563218390804598, "percentage": 28.54, "elapsed_time": "3:39:09", "remaining_time": "9:08:37"} |
|
{"current_steps": 150, "total_steps": 522, "loss": 0.6491, "lr": 0.00018002674581327094, "epoch": 0.8620689655172413, "percentage": 28.74, "elapsed_time": "3:40:01", "remaining_time": "9:05:39"} |
|
{"current_steps": 150, "total_steps": 522, "eval_loss": 0.6660047769546509, "epoch": 0.8620689655172413, "percentage": 28.74, "elapsed_time": "3:46:47", "remaining_time": "9:22:27"} |
|
{"current_steps": 151, "total_steps": 522, "loss": 0.7081, "lr": 0.00017962328291059888, "epoch": 0.867816091954023, "percentage": 28.93, "elapsed_time": "3:47:40", "remaining_time": "9:19:23"} |
|
{"current_steps": 152, "total_steps": 522, "loss": 0.6622, "lr": 0.00017921624734111292, "epoch": 0.8735632183908046, "percentage": 29.12, "elapsed_time": "3:48:30", "remaining_time": "9:16:13"} |
|
{"current_steps": 153, "total_steps": 522, "loss": 0.6393, "lr": 0.0001788056573683464, "epoch": 0.8793103448275862, "percentage": 29.31, "elapsed_time": "3:49:20", "remaining_time": "9:13:07"} |
|
{"current_steps": 154, "total_steps": 522, "loss": 0.6384, "lr": 0.00017839153141531718, "epoch": 0.8850574712643678, "percentage": 29.5, "elapsed_time": "3:50:15", "remaining_time": "9:10:14"} |
|
{"current_steps": 155, "total_steps": 522, "loss": 0.6512, "lr": 0.00017797388806370132, "epoch": 0.8908045977011494, "percentage": 29.69, "elapsed_time": "3:51:03", "remaining_time": "9:07:04"} |
|
{"current_steps": 156, "total_steps": 522, "loss": 0.6502, "lr": 0.00017755274605299923, "epoch": 0.896551724137931, "percentage": 29.89, "elapsed_time": "3:51:52", "remaining_time": "9:04:00"} |
|
{"current_steps": 157, "total_steps": 522, "loss": 0.6666, "lr": 0.00017712812427969485, "epoch": 0.9022988505747126, "percentage": 30.08, "elapsed_time": "3:52:38", "remaining_time": "9:00:51"} |
|
{"current_steps": 158, "total_steps": 522, "loss": 0.6495, "lr": 0.00017670004179640774, "epoch": 0.9080459770114943, "percentage": 30.27, "elapsed_time": "3:53:30", "remaining_time": "8:57:57"} |
|
{"current_steps": 159, "total_steps": 522, "loss": 0.6747, "lr": 0.0001762685178110382, "epoch": 0.9137931034482759, "percentage": 30.46, "elapsed_time": "3:54:20", "remaining_time": "8:55:00"} |
|
{"current_steps": 160, "total_steps": 522, "loss": 0.7015, "lr": 0.0001758335716859055, "epoch": 0.9195402298850575, "percentage": 30.65, "elapsed_time": "3:55:09", "remaining_time": "8:52:02"} |
|
{"current_steps": 160, "total_steps": 522, "eval_loss": 0.663636326789856, "epoch": 0.9195402298850575, "percentage": 30.65, "elapsed_time": "4:01:54", "remaining_time": "9:07:18"} |
|
{"current_steps": 161, "total_steps": 522, "loss": 0.6825, "lr": 0.00017539522293687898, "epoch": 0.9252873563218391, "percentage": 30.84, "elapsed_time": "4:02:45", "remaining_time": "9:04:18"} |
|
{"current_steps": 162, "total_steps": 522, "loss": 0.674, "lr": 0.00017495349123250242, "epoch": 0.9310344827586207, "percentage": 31.03, "elapsed_time": "4:03:32", "remaining_time": "9:01:11"} |
|
{"current_steps": 163, "total_steps": 522, "loss": 0.6477, "lr": 0.00017450839639311162, "epoch": 0.9367816091954023, "percentage": 31.23, "elapsed_time": "4:04:25", "remaining_time": "8:58:20"} |
|
{"current_steps": 164, "total_steps": 522, "loss": 0.6742, "lr": 0.00017405995838994494, "epoch": 0.9425287356321839, "percentage": 31.42, "elapsed_time": "4:05:14", "remaining_time": "8:55:20"} |
|
{"current_steps": 165, "total_steps": 522, "loss": 0.6509, "lr": 0.00017360819734424715, "epoch": 0.9482758620689655, "percentage": 31.61, "elapsed_time": "4:05:59", "remaining_time": "8:52:13"} |
|
{"current_steps": 166, "total_steps": 522, "loss": 0.6602, "lr": 0.0001731531335263669, "epoch": 0.9540229885057471, "percentage": 31.8, "elapsed_time": "4:06:47", "remaining_time": "8:49:16"} |
|
{"current_steps": 167, "total_steps": 522, "loss": 0.6697, "lr": 0.00017269478735484683, "epoch": 0.9597701149425287, "percentage": 31.99, "elapsed_time": "4:07:32", "remaining_time": "8:46:12"} |
|
{"current_steps": 168, "total_steps": 522, "loss": 0.6636, "lr": 0.00017223317939550753, "epoch": 0.9655172413793104, "percentage": 32.18, "elapsed_time": "4:08:17", "remaining_time": "8:43:11"} |
|
{"current_steps": 169, "total_steps": 522, "loss": 0.6733, "lr": 0.00017176833036052495, "epoch": 0.9712643678160919, "percentage": 32.38, "elapsed_time": "4:09:03", "remaining_time": "8:40:12"} |
|
{"current_steps": 170, "total_steps": 522, "loss": 0.6523, "lr": 0.0001713002611075007, "epoch": 0.9770114942528736, "percentage": 32.57, "elapsed_time": "4:09:54", "remaining_time": "8:37:27"} |
|
{"current_steps": 170, "total_steps": 522, "eval_loss": 0.6618800759315491, "epoch": 0.9770114942528736, "percentage": 32.57, "elapsed_time": "4:16:45", "remaining_time": "8:51:38"} |
|
{"current_steps": 171, "total_steps": 522, "loss": 0.658, "lr": 0.0001708289926385265, "epoch": 0.9827586206896551, "percentage": 32.76, "elapsed_time": "4:17:34", "remaining_time": "8:48:42"} |
|
{"current_steps": 172, "total_steps": 522, "loss": 0.6697, "lr": 0.0001703545460992416, "epoch": 0.9885057471264368, "percentage": 32.95, "elapsed_time": "4:18:24", "remaining_time": "8:45:48"} |
|
{"current_steps": 173, "total_steps": 522, "loss": 0.6231, "lr": 0.00016987694277788417, "epoch": 0.9942528735632183, "percentage": 33.14, "elapsed_time": "4:19:16", "remaining_time": "8:43:02"} |
|
{"current_steps": 174, "total_steps": 522, "loss": 0.6374, "lr": 0.0001693962041043359, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "4:20:03", "remaining_time": "8:40:07"} |
|
{"current_steps": 175, "total_steps": 522, "loss": 0.6271, "lr": 0.00016891235164916065, "epoch": 1.0057471264367817, "percentage": 33.52, "elapsed_time": "4:21:07", "remaining_time": "8:37:46"} |
|
{"current_steps": 176, "total_steps": 522, "loss": 0.649, "lr": 0.00016842540712263637, "epoch": 1.0114942528735633, "percentage": 33.72, "elapsed_time": "4:22:01", "remaining_time": "8:35:06"} |
|
{"current_steps": 177, "total_steps": 522, "loss": 0.654, "lr": 0.00016793539237378128, "epoch": 1.0172413793103448, "percentage": 33.91, "elapsed_time": "4:22:52", "remaining_time": "8:32:23"} |
|
{"current_steps": 178, "total_steps": 522, "loss": 0.6313, "lr": 0.00016744232938937308, "epoch": 1.0229885057471264, "percentage": 34.1, "elapsed_time": "4:23:47", "remaining_time": "8:29:47"} |
|
{"current_steps": 179, "total_steps": 522, "loss": 0.6803, "lr": 0.0001669462402929629, "epoch": 1.028735632183908, "percentage": 34.29, "elapsed_time": "4:24:30", "remaining_time": "8:26:51"} |
|
{"current_steps": 180, "total_steps": 522, "loss": 0.6672, "lr": 0.00016644714734388217, "epoch": 1.0344827586206897, "percentage": 34.48, "elapsed_time": "4:25:20", "remaining_time": "8:24:08"} |
|
{"current_steps": 180, "total_steps": 522, "eval_loss": 0.6602174043655396, "epoch": 1.0344827586206897, "percentage": 34.48, "elapsed_time": "4:32:10", "remaining_time": "8:37:08"} |
|
{"current_steps": 181, "total_steps": 522, "loss": 0.6257, "lr": 0.00016594507293624425, "epoch": 1.0402298850574712, "percentage": 34.67, "elapsed_time": "4:33:03", "remaining_time": "8:34:25"} |
|
{"current_steps": 182, "total_steps": 522, "loss": 0.641, "lr": 0.00016544003959793925, "epoch": 1.0459770114942528, "percentage": 34.87, "elapsed_time": "4:33:53", "remaining_time": "8:31:39"} |
|
{"current_steps": 183, "total_steps": 522, "loss": 0.6351, "lr": 0.00016493206998962354, "epoch": 1.0517241379310345, "percentage": 35.06, "elapsed_time": "4:34:43", "remaining_time": "8:28:55"} |
|
{"current_steps": 184, "total_steps": 522, "loss": 0.6635, "lr": 0.0001644211869037027, "epoch": 1.0574712643678161, "percentage": 35.25, "elapsed_time": "4:35:32", "remaining_time": "8:26:09"} |
|
{"current_steps": 185, "total_steps": 522, "loss": 0.6458, "lr": 0.00016390741326330907, "epoch": 1.0632183908045978, "percentage": 35.44, "elapsed_time": "4:36:26", "remaining_time": "8:23:33"} |
|
{"current_steps": 186, "total_steps": 522, "loss": 0.6209, "lr": 0.00016339077212127294, "epoch": 1.0689655172413792, "percentage": 35.63, "elapsed_time": "4:37:20", "remaining_time": "8:20:59"} |
|
{"current_steps": 187, "total_steps": 522, "loss": 0.6336, "lr": 0.0001628712866590885, "epoch": 1.0747126436781609, "percentage": 35.82, "elapsed_time": "4:38:06", "remaining_time": "8:18:12"} |
|
{"current_steps": 188, "total_steps": 522, "loss": 0.6496, "lr": 0.00016234898018587337, "epoch": 1.0804597701149425, "percentage": 36.02, "elapsed_time": "4:38:58", "remaining_time": "8:15:37"} |
|
{"current_steps": 189, "total_steps": 522, "loss": 0.668, "lr": 0.00016182387613732291, "epoch": 1.0862068965517242, "percentage": 36.21, "elapsed_time": "4:39:44", "remaining_time": "8:12:52"} |
|
{"current_steps": 190, "total_steps": 522, "loss": 0.6862, "lr": 0.00016129599807465875, "epoch": 1.0919540229885056, "percentage": 36.4, "elapsed_time": "4:40:38", "remaining_time": "8:10:22"} |
|
{"current_steps": 190, "total_steps": 522, "eval_loss": 0.6588147282600403, "epoch": 1.0919540229885056, "percentage": 36.4, "elapsed_time": "4:47:24", "remaining_time": "8:22:12"} |
|
{"current_steps": 191, "total_steps": 522, "loss": 0.6367, "lr": 0.0001607653696835713, "epoch": 1.0977011494252873, "percentage": 36.59, "elapsed_time": "4:48:13", "remaining_time": "8:19:28"} |
|
{"current_steps": 192, "total_steps": 522, "loss": 0.6391, "lr": 0.00016023201477315731, "epoch": 1.103448275862069, "percentage": 36.78, "elapsed_time": "4:49:07", "remaining_time": "8:16:56"} |
|
{"current_steps": 193, "total_steps": 522, "loss": 0.6462, "lr": 0.0001596959572748514, "epoch": 1.1091954022988506, "percentage": 36.97, "elapsed_time": "4:49:58", "remaining_time": "8:14:18"} |
|
{"current_steps": 194, "total_steps": 522, "loss": 0.6356, "lr": 0.00015915722124135227, "epoch": 1.1149425287356323, "percentage": 37.16, "elapsed_time": "4:50:50", "remaining_time": "8:11:43"} |
|
{"current_steps": 195, "total_steps": 522, "loss": 0.6557, "lr": 0.00015861583084554349, "epoch": 1.1206896551724137, "percentage": 37.36, "elapsed_time": "4:51:40", "remaining_time": "8:09:06"} |
|
{"current_steps": 196, "total_steps": 522, "loss": 0.6401, "lr": 0.0001580718103794089, "epoch": 1.1264367816091954, "percentage": 37.55, "elapsed_time": "4:52:31", "remaining_time": "8:06:32"} |
|
{"current_steps": 197, "total_steps": 522, "loss": 0.6641, "lr": 0.00015752518425294257, "epoch": 1.132183908045977, "percentage": 37.74, "elapsed_time": "4:53:21", "remaining_time": "8:03:58"} |
|
{"current_steps": 198, "total_steps": 522, "loss": 0.6689, "lr": 0.00015697597699305366, "epoch": 1.1379310344827587, "percentage": 37.93, "elapsed_time": "4:54:10", "remaining_time": "8:01:22"} |
|
{"current_steps": 199, "total_steps": 522, "loss": 0.663, "lr": 0.00015642421324246568, "epoch": 1.1436781609195403, "percentage": 38.12, "elapsed_time": "4:54:58", "remaining_time": "7:58:47"} |
|
{"current_steps": 200, "total_steps": 522, "loss": 0.6755, "lr": 0.00015586991775861102, "epoch": 1.1494252873563218, "percentage": 38.31, "elapsed_time": "4:55:49", "remaining_time": "7:56:17"} |
|
{"current_steps": 200, "total_steps": 522, "eval_loss": 0.6577329635620117, "epoch": 1.1494252873563218, "percentage": 38.31, "elapsed_time": "5:02:36", "remaining_time": "8:07:11"} |
|
{"current_steps": 201, "total_steps": 522, "loss": 0.62, "lr": 0.00015531311541251995, "epoch": 1.1551724137931034, "percentage": 38.51, "elapsed_time": "5:03:29", "remaining_time": "8:04:40"} |
|
{"current_steps": 202, "total_steps": 522, "loss": 0.6456, "lr": 0.00015475383118770472, "epoch": 1.160919540229885, "percentage": 38.7, "elapsed_time": "5:04:21", "remaining_time": "8:02:09"} |
|
{"current_steps": 203, "total_steps": 522, "loss": 0.6421, "lr": 0.00015419209017903852, "epoch": 1.1666666666666667, "percentage": 38.89, "elapsed_time": "5:05:10", "remaining_time": "7:59:34"} |
|
{"current_steps": 204, "total_steps": 522, "loss": 0.6342, "lr": 0.0001536279175916296, "epoch": 1.1724137931034484, "percentage": 39.08, "elapsed_time": "5:05:59", "remaining_time": "7:56:58"} |
|
{"current_steps": 205, "total_steps": 522, "loss": 0.6533, "lr": 0.0001530613387396901, "epoch": 1.1781609195402298, "percentage": 39.27, "elapsed_time": "5:06:56", "remaining_time": "7:54:38"} |
|
{"current_steps": 206, "total_steps": 522, "loss": 0.6511, "lr": 0.0001524923790454004, "epoch": 1.1839080459770115, "percentage": 39.46, "elapsed_time": "5:07:49", "remaining_time": "7:52:11"} |
|
{"current_steps": 207, "total_steps": 522, "loss": 0.6363, "lr": 0.00015192106403776848, "epoch": 1.1896551724137931, "percentage": 39.66, "elapsed_time": "5:08:45", "remaining_time": "7:49:50"} |
|
{"current_steps": 208, "total_steps": 522, "loss": 0.6517, "lr": 0.0001513474193514842, "epoch": 1.1954022988505748, "percentage": 39.85, "elapsed_time": "5:09:34", "remaining_time": "7:47:20"} |
|
{"current_steps": 209, "total_steps": 522, "loss": 0.6264, "lr": 0.00015077147072576933, "epoch": 1.2011494252873562, "percentage": 40.04, "elapsed_time": "5:10:28", "remaining_time": "7:44:58"} |
|
{"current_steps": 210, "total_steps": 522, "loss": 0.6279, "lr": 0.00015019324400322243, "epoch": 1.206896551724138, "percentage": 40.23, "elapsed_time": "5:11:13", "remaining_time": "7:42:24"} |
|
{"current_steps": 210, "total_steps": 522, "eval_loss": 0.6562607884407043, "epoch": 1.206896551724138, "percentage": 40.23, "elapsed_time": "5:18:01", "remaining_time": "7:52:30"} |
|
{"current_steps": 211, "total_steps": 522, "loss": 0.6726, "lr": 0.00014961276512865954, "epoch": 1.2126436781609196, "percentage": 40.42, "elapsed_time": "5:18:56", "remaining_time": "7:50:05"} |
|
{"current_steps": 212, "total_steps": 522, "loss": 0.6493, "lr": 0.00014903006014794983, "epoch": 1.2183908045977012, "percentage": 40.61, "elapsed_time": "5:19:56", "remaining_time": "7:47:50"} |
|
{"current_steps": 213, "total_steps": 522, "loss": 0.6367, "lr": 0.00014844515520684703, "epoch": 1.2241379310344827, "percentage": 40.8, "elapsed_time": "5:20:46", "remaining_time": "7:45:20"} |
|
{"current_steps": 214, "total_steps": 522, "loss": 0.6734, "lr": 0.00014785807654981627, "epoch": 1.2298850574712643, "percentage": 41.0, "elapsed_time": "5:21:33", "remaining_time": "7:42:47"} |
|
{"current_steps": 215, "total_steps": 522, "loss": 0.6354, "lr": 0.00014726885051885653, "epoch": 1.235632183908046, "percentage": 41.19, "elapsed_time": "5:22:21", "remaining_time": "7:40:18"} |
|
{"current_steps": 216, "total_steps": 522, "loss": 0.6412, "lr": 0.0001466775035523186, "epoch": 1.2413793103448276, "percentage": 41.38, "elapsed_time": "5:23:15", "remaining_time": "7:37:56"} |
|
{"current_steps": 217, "total_steps": 522, "loss": 0.6635, "lr": 0.00014608406218371894, "epoch": 1.2471264367816093, "percentage": 41.57, "elapsed_time": "5:24:07", "remaining_time": "7:35:34"} |
|
{"current_steps": 218, "total_steps": 522, "loss": 0.6403, "lr": 0.00014548855304054886, "epoch": 1.2528735632183907, "percentage": 41.76, "elapsed_time": "5:24:56", "remaining_time": "7:33:07"} |
|
{"current_steps": 219, "total_steps": 522, "loss": 0.6253, "lr": 0.00014489100284308017, "epoch": 1.2586206896551724, "percentage": 41.95, "elapsed_time": "5:25:45", "remaining_time": "7:30:43"} |
|
{"current_steps": 220, "total_steps": 522, "loss": 0.6622, "lr": 0.00014429143840316585, "epoch": 1.264367816091954, "percentage": 42.15, "elapsed_time": "5:26:33", "remaining_time": "7:28:15"} |
|
{"current_steps": 220, "total_steps": 522, "eval_loss": 0.6551185250282288, "epoch": 1.264367816091954, "percentage": 42.15, "elapsed_time": "5:33:21", "remaining_time": "7:37:36"} |
|
{"current_steps": 221, "total_steps": 522, "loss": 0.6226, "lr": 0.00014368988662303732, "epoch": 1.2701149425287357, "percentage": 42.34, "elapsed_time": "5:34:09", "remaining_time": "7:35:07"} |
|
{"current_steps": 222, "total_steps": 522, "loss": 0.6661, "lr": 0.00014308637449409706, "epoch": 1.2758620689655173, "percentage": 42.53, "elapsed_time": "5:35:04", "remaining_time": "7:32:47"} |
|
{"current_steps": 223, "total_steps": 522, "loss": 0.6243, "lr": 0.00014248092909570774, "epoch": 1.2816091954022988, "percentage": 42.72, "elapsed_time": "5:35:52", "remaining_time": "7:30:21"} |
|
{"current_steps": 224, "total_steps": 522, "loss": 0.6348, "lr": 0.00014187357759397714, "epoch": 1.2873563218390804, "percentage": 42.91, "elapsed_time": "5:36:39", "remaining_time": "7:27:52"} |
|
{"current_steps": 225, "total_steps": 522, "loss": 0.6386, "lr": 0.00014126434724053913, "epoch": 1.293103448275862, "percentage": 43.1, "elapsed_time": "5:37:31", "remaining_time": "7:25:32"} |
|
{"current_steps": 226, "total_steps": 522, "loss": 0.6276, "lr": 0.00014065326537133094, "epoch": 1.2988505747126438, "percentage": 43.3, "elapsed_time": "5:38:20", "remaining_time": "7:23:08"} |
|
{"current_steps": 227, "total_steps": 522, "loss": 0.6431, "lr": 0.0001400403594053667, "epoch": 1.3045977011494254, "percentage": 43.49, "elapsed_time": "5:39:14", "remaining_time": "7:20:51"} |
|
{"current_steps": 228, "total_steps": 522, "loss": 0.6457, "lr": 0.00013942565684350698, "epoch": 1.3103448275862069, "percentage": 43.68, "elapsed_time": "5:40:07", "remaining_time": "7:18:34"} |
|
{"current_steps": 229, "total_steps": 522, "loss": 0.6247, "lr": 0.00013880918526722497, "epoch": 1.3160919540229885, "percentage": 43.87, "elapsed_time": "5:40:59", "remaining_time": "7:16:17"} |
|
{"current_steps": 230, "total_steps": 522, "loss": 0.6329, "lr": 0.00013819097233736888, "epoch": 1.3218390804597702, "percentage": 44.06, "elapsed_time": "5:41:49", "remaining_time": "7:13:57"} |
|
{"current_steps": 230, "total_steps": 522, "eval_loss": 0.6541800498962402, "epoch": 1.3218390804597702, "percentage": 44.06, "elapsed_time": "5:48:34", "remaining_time": "7:22:31"} |
|
{"current_steps": 231, "total_steps": 522, "loss": 0.6697, "lr": 0.00013757104579292082, "epoch": 1.3275862068965516, "percentage": 44.25, "elapsed_time": "5:49:24", "remaining_time": "7:20:09"} |
|
{"current_steps": 232, "total_steps": 522, "loss": 0.6279, "lr": 0.00013694943344975212, "epoch": 1.3333333333333333, "percentage": 44.44, "elapsed_time": "5:50:21", "remaining_time": "7:17:56"} |
|
{"current_steps": 233, "total_steps": 522, "loss": 0.6487, "lr": 0.00013632616319937522, "epoch": 1.339080459770115, "percentage": 44.64, "elapsed_time": "5:51:08", "remaining_time": "7:15:31"} |
|
{"current_steps": 234, "total_steps": 522, "loss": 0.6456, "lr": 0.00013570126300769232, "epoch": 1.3448275862068966, "percentage": 44.83, "elapsed_time": "5:51:57", "remaining_time": "7:13:10"} |
|
{"current_steps": 235, "total_steps": 522, "loss": 0.6302, "lr": 0.0001350747609137404, "epoch": 1.3505747126436782, "percentage": 45.02, "elapsed_time": "5:52:46", "remaining_time": "7:10:50"} |
|
{"current_steps": 236, "total_steps": 522, "loss": 0.6184, "lr": 0.0001344466850284333, "epoch": 1.3563218390804597, "percentage": 45.21, "elapsed_time": "5:53:41", "remaining_time": "7:08:37"} |
|
{"current_steps": 237, "total_steps": 522, "loss": 0.6618, "lr": 0.00013381706353330014, "epoch": 1.3620689655172413, "percentage": 45.4, "elapsed_time": "5:54:30", "remaining_time": "7:06:18"} |
|
{"current_steps": 238, "total_steps": 522, "loss": 0.6191, "lr": 0.0001331859246792211, "epoch": 1.367816091954023, "percentage": 45.59, "elapsed_time": "5:55:19", "remaining_time": "7:03:59"} |
|
{"current_steps": 239, "total_steps": 522, "loss": 0.6397, "lr": 0.0001325532967851596, "epoch": 1.3735632183908046, "percentage": 45.79, "elapsed_time": "5:56:07", "remaining_time": "7:01:41"} |
|
{"current_steps": 240, "total_steps": 522, "loss": 0.6559, "lr": 0.00013191920823689177, "epoch": 1.3793103448275863, "percentage": 45.98, "elapsed_time": "5:56:56", "remaining_time": "6:59:24"} |
|
{"current_steps": 240, "total_steps": 522, "eval_loss": 0.6528159379959106, "epoch": 1.3793103448275863, "percentage": 45.98, "elapsed_time": "6:03:44", "remaining_time": "7:07:23"} |
|
{"current_steps": 241, "total_steps": 522, "loss": 0.6736, "lr": 0.00013128368748573273, "epoch": 1.3850574712643677, "percentage": 46.17, "elapsed_time": "6:04:36", "remaining_time": "7:05:07"} |
|
{"current_steps": 242, "total_steps": 522, "loss": 0.6467, "lr": 0.00013064676304726, "epoch": 1.3908045977011494, "percentage": 46.36, "elapsed_time": "6:05:23", "remaining_time": "7:02:46"} |
|
{"current_steps": 243, "total_steps": 522, "loss": 0.6956, "lr": 0.0001300084635000341, "epoch": 1.396551724137931, "percentage": 46.55, "elapsed_time": "6:06:09", "remaining_time": "7:00:23"} |
|
{"current_steps": 244, "total_steps": 522, "loss": 0.6474, "lr": 0.000129368817484316, "epoch": 1.4022988505747127, "percentage": 46.74, "elapsed_time": "6:07:02", "remaining_time": "6:58:10"} |
|
{"current_steps": 245, "total_steps": 522, "loss": 0.6301, "lr": 0.0001287278537007824, "epoch": 1.4080459770114944, "percentage": 46.93, "elapsed_time": "6:07:50", "remaining_time": "6:55:52"} |
|
{"current_steps": 246, "total_steps": 522, "loss": 0.6238, "lr": 0.00012808560090923758, "epoch": 1.4137931034482758, "percentage": 47.13, "elapsed_time": "6:08:40", "remaining_time": "6:53:38"} |
|
{"current_steps": 247, "total_steps": 522, "loss": 0.6383, "lr": 0.00012744208792732324, "epoch": 1.4195402298850575, "percentage": 47.32, "elapsed_time": "6:09:30", "remaining_time": "6:51:23"} |
|
{"current_steps": 248, "total_steps": 522, "loss": 0.642, "lr": 0.00012679734362922528, "epoch": 1.4252873563218391, "percentage": 47.51, "elapsed_time": "6:10:22", "remaining_time": "6:49:12"} |
|
{"current_steps": 249, "total_steps": 522, "loss": 0.6152, "lr": 0.00012615139694437835, "epoch": 1.4310344827586206, "percentage": 47.7, "elapsed_time": "6:11:10", "remaining_time": "6:46:56"} |
|
{"current_steps": 250, "total_steps": 522, "loss": 0.6389, "lr": 0.00012550427685616765, "epoch": 1.4367816091954024, "percentage": 47.89, "elapsed_time": "6:12:00", "remaining_time": "6:44:44"} |
|
{"current_steps": 250, "total_steps": 522, "eval_loss": 0.6516815423965454, "epoch": 1.4367816091954024, "percentage": 47.89, "elapsed_time": "6:18:51", "remaining_time": "6:52:12"} |
|
{"current_steps": 251, "total_steps": 522, "loss": 0.6365, "lr": 0.00012485601240062869, "epoch": 1.4425287356321839, "percentage": 48.08, "elapsed_time": "6:19:42", "remaining_time": "6:49:58"} |
|
{"current_steps": 252, "total_steps": 522, "loss": 0.6345, "lr": 0.00012420663266514417, "epoch": 1.4482758620689655, "percentage": 48.28, "elapsed_time": "6:20:37", "remaining_time": "6:47:48"} |
|
{"current_steps": 253, "total_steps": 522, "loss": 0.6365, "lr": 0.0001235561667871391, "epoch": 1.4540229885057472, "percentage": 48.47, "elapsed_time": "6:21:27", "remaining_time": "6:45:34"} |
|
{"current_steps": 254, "total_steps": 522, "loss": 0.6316, "lr": 0.0001229046439527732, "epoch": 1.4597701149425286, "percentage": 48.66, "elapsed_time": "6:22:25", "remaining_time": "6:43:29"} |
|
{"current_steps": 255, "total_steps": 522, "loss": 0.6221, "lr": 0.00012225209339563145, "epoch": 1.4655172413793103, "percentage": 48.85, "elapsed_time": "6:23:20", "remaining_time": "6:41:22"} |
|
{"current_steps": 256, "total_steps": 522, "loss": 0.6485, "lr": 0.00012159854439541245, "epoch": 1.471264367816092, "percentage": 49.04, "elapsed_time": "6:24:06", "remaining_time": "6:39:06"} |
|
{"current_steps": 257, "total_steps": 522, "loss": 0.6607, "lr": 0.00012094402627661447, "epoch": 1.4770114942528736, "percentage": 49.23, "elapsed_time": "6:24:53", "remaining_time": "6:36:52"} |
|
{"current_steps": 258, "total_steps": 522, "loss": 0.6764, "lr": 0.00012028856840721974, "epoch": 1.4827586206896552, "percentage": 49.43, "elapsed_time": "6:25:40", "remaining_time": "6:34:38"} |
|
{"current_steps": 259, "total_steps": 522, "loss": 0.6587, "lr": 0.00011963220019737691, "epoch": 1.4885057471264367, "percentage": 49.62, "elapsed_time": "6:26:25", "remaining_time": "6:32:23"} |
|
{"current_steps": 260, "total_steps": 522, "loss": 0.6476, "lr": 0.00011897495109808107, "epoch": 1.4942528735632183, "percentage": 49.81, "elapsed_time": "6:27:10", "remaining_time": "6:30:09"} |
|
{"current_steps": 260, "total_steps": 522, "eval_loss": 0.6506026983261108, "epoch": 1.4942528735632183, "percentage": 49.81, "elapsed_time": "6:33:58", "remaining_time": "6:37:00"} |
|
{"current_steps": 261, "total_steps": 522, "loss": 0.6378, "lr": 0.00011831685059985262, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "6:34:45", "remaining_time": "6:34:45"} |
|
{"current_steps": 262, "total_steps": 522, "loss": 0.6679, "lr": 0.00011765792823141384, "epoch": 1.5057471264367817, "percentage": 50.19, "elapsed_time": "6:35:39", "remaining_time": "6:32:38"} |
|
{"current_steps": 263, "total_steps": 522, "loss": 0.6199, "lr": 0.00011699821355836409, "epoch": 1.5114942528735633, "percentage": 50.38, "elapsed_time": "6:36:31", "remaining_time": "6:30:29"} |
|
{"current_steps": 264, "total_steps": 522, "loss": 0.6369, "lr": 0.00011633773618185302, "epoch": 1.5172413793103448, "percentage": 50.57, "elapsed_time": "6:37:27", "remaining_time": "6:28:25"} |
|
{"current_steps": 265, "total_steps": 522, "loss": 0.6248, "lr": 0.00011567652573725262, "epoch": 1.5229885057471264, "percentage": 50.77, "elapsed_time": "6:38:18", "remaining_time": "6:26:16"} |
|
{"current_steps": 266, "total_steps": 522, "loss": 0.645, "lr": 0.00011501461189282733, "epoch": 1.528735632183908, "percentage": 50.96, "elapsed_time": "6:39:06", "remaining_time": "6:24:06"} |
|
{"current_steps": 267, "total_steps": 522, "loss": 0.6382, "lr": 0.00011435202434840287, "epoch": 1.5344827586206895, "percentage": 51.15, "elapsed_time": "6:39:59", "remaining_time": "6:22:01"} |
|
{"current_steps": 268, "total_steps": 522, "loss": 0.6064, "lr": 0.0001136887928340336, "epoch": 1.5402298850574714, "percentage": 51.34, "elapsed_time": "6:40:48", "remaining_time": "6:19:52"} |
|
{"current_steps": 269, "total_steps": 522, "loss": 0.6467, "lr": 0.00011302494710866857, "epoch": 1.5459770114942528, "percentage": 51.53, "elapsed_time": "6:41:37", "remaining_time": "6:17:43"} |
|
{"current_steps": 270, "total_steps": 522, "loss": 0.6412, "lr": 0.00011236051695881633, "epoch": 1.5517241379310345, "percentage": 51.72, "elapsed_time": "6:42:29", "remaining_time": "6:15:39"} |
|
{"current_steps": 270, "total_steps": 522, "eval_loss": 0.6497076749801636, "epoch": 1.5517241379310345, "percentage": 51.72, "elapsed_time": "6:49:17", "remaining_time": "6:22:00"} |
|
{"current_steps": 271, "total_steps": 522, "loss": 0.6659, "lr": 0.00011169553219720828, "epoch": 1.5574712643678161, "percentage": 51.92, "elapsed_time": "6:50:05", "remaining_time": "6:19:49"} |
|
{"current_steps": 272, "total_steps": 522, "loss": 0.6578, "lr": 0.00011103002266146096, "epoch": 1.5632183908045976, "percentage": 52.11, "elapsed_time": "6:50:54", "remaining_time": "6:17:40"} |
|
{"current_steps": 273, "total_steps": 522, "loss": 0.6187, "lr": 0.0001103640182127375, "epoch": 1.5689655172413794, "percentage": 52.3, "elapsed_time": "6:51:46", "remaining_time": "6:15:34"} |
|
{"current_steps": 274, "total_steps": 522, "loss": 0.6507, "lr": 0.00010969754873440743, "epoch": 1.5747126436781609, "percentage": 52.49, "elapsed_time": "6:52:37", "remaining_time": "6:13:28"} |
|
{"current_steps": 275, "total_steps": 522, "loss": 0.6381, "lr": 0.00010903064413070612, "epoch": 1.5804597701149425, "percentage": 52.68, "elapsed_time": "6:53:25", "remaining_time": "6:11:19"} |
|
{"current_steps": 276, "total_steps": 522, "loss": 0.6302, "lr": 0.00010836333432539272, "epoch": 1.5862068965517242, "percentage": 52.87, "elapsed_time": "6:54:15", "remaining_time": "6:09:13"} |
|
{"current_steps": 277, "total_steps": 522, "loss": 0.618, "lr": 0.00010769564926040769, "epoch": 1.5919540229885056, "percentage": 53.07, "elapsed_time": "6:55:00", "remaining_time": "6:07:03"} |
|
{"current_steps": 278, "total_steps": 522, "loss": 0.6308, "lr": 0.0001070276188945293, "epoch": 1.5977011494252875, "percentage": 53.26, "elapsed_time": "6:55:44", "remaining_time": "6:04:54"} |
|
{"current_steps": 279, "total_steps": 522, "loss": 0.6316, "lr": 0.00010635927320202928, "epoch": 1.603448275862069, "percentage": 53.45, "elapsed_time": "6:56:39", "remaining_time": "6:02:53"} |
|
{"current_steps": 280, "total_steps": 522, "loss": 0.6232, "lr": 0.00010569064217132791, "epoch": 1.6091954022988506, "percentage": 53.64, "elapsed_time": "6:57:28", "remaining_time": "6:00:49"} |
|
{"current_steps": 280, "total_steps": 522, "eval_loss": 0.6484516859054565, "epoch": 1.6091954022988506, "percentage": 53.64, "elapsed_time": "7:04:14", "remaining_time": "6:06:40"} |
|
{"current_steps": 281, "total_steps": 522, "loss": 0.6207, "lr": 0.00010502175580364857, "epoch": 1.6149425287356323, "percentage": 53.83, "elapsed_time": "7:05:05", "remaining_time": "6:04:34"} |
|
{"current_steps": 282, "total_steps": 522, "loss": 0.6604, "lr": 0.00010435264411167148, "epoch": 1.6206896551724137, "percentage": 54.02, "elapsed_time": "7:05:55", "remaining_time": "6:02:29"} |
|
{"current_steps": 283, "total_steps": 522, "loss": 0.6444, "lr": 0.0001036833371181871, "epoch": 1.6264367816091954, "percentage": 54.21, "elapsed_time": "7:06:46", "remaining_time": "6:00:24"} |
|
{"current_steps": 284, "total_steps": 522, "loss": 0.6439, "lr": 0.00010301386485474889, "epoch": 1.632183908045977, "percentage": 54.41, "elapsed_time": "7:07:36", "remaining_time": "5:58:20"} |
|
{"current_steps": 285, "total_steps": 522, "loss": 0.639, "lr": 0.00010234425736032607, "epoch": 1.6379310344827587, "percentage": 54.6, "elapsed_time": "7:08:21", "remaining_time": "5:56:13"} |
|
{"current_steps": 286, "total_steps": 522, "loss": 0.6056, "lr": 0.00010167454467995549, "epoch": 1.6436781609195403, "percentage": 54.79, "elapsed_time": "7:09:11", "remaining_time": "5:54:09"} |
|
{"current_steps": 287, "total_steps": 522, "loss": 0.6341, "lr": 0.00010100475686339379, "epoch": 1.6494252873563218, "percentage": 54.98, "elapsed_time": "7:09:59", "remaining_time": "5:52:05"} |
|
{"current_steps": 288, "total_steps": 522, "loss": 0.6193, "lr": 0.00010033492396376878, "epoch": 1.6551724137931034, "percentage": 55.17, "elapsed_time": "7:10:47", "remaining_time": "5:50:00"} |
|
{"current_steps": 289, "total_steps": 522, "loss": 0.6227, "lr": 9.966507603623125e-05, "epoch": 1.660919540229885, "percentage": 55.36, "elapsed_time": "7:11:34", "remaining_time": "5:47:56"} |
|
{"current_steps": 290, "total_steps": 522, "loss": 0.6243, "lr": 9.899524313660624e-05, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "7:12:25", "remaining_time": "5:45:56"} |
|
{"current_steps": 290, "total_steps": 522, "eval_loss": 0.6477526426315308, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "7:19:10", "remaining_time": "5:51:20"} |
|
{"current_steps": 291, "total_steps": 522, "loss": 0.6328, "lr": 9.832545532004454e-05, "epoch": 1.6724137931034484, "percentage": 55.75, "elapsed_time": "7:20:02", "remaining_time": "5:49:18"} |
|
{"current_steps": 292, "total_steps": 522, "loss": 0.6212, "lr": 9.765574263967396e-05, "epoch": 1.6781609195402298, "percentage": 55.94, "elapsed_time": "7:20:51", "remaining_time": "5:47:15"} |
|
{"current_steps": 293, "total_steps": 522, "loss": 0.6563, "lr": 9.698613514525116e-05, "epoch": 1.6839080459770115, "percentage": 56.13, "elapsed_time": "7:21:41", "remaining_time": "5:45:12"} |
|
{"current_steps": 294, "total_steps": 522, "loss": 0.6278, "lr": 9.631666288181293e-05, "epoch": 1.6896551724137931, "percentage": 56.32, "elapsed_time": "7:22:35", "remaining_time": "5:43:14"} |
|
{"current_steps": 295, "total_steps": 522, "loss": 0.6376, "lr": 9.564735588832856e-05, "epoch": 1.6954022988505746, "percentage": 56.51, "elapsed_time": "7:23:20", "remaining_time": "5:41:08"} |
|
{"current_steps": 296, "total_steps": 522, "loss": 0.6149, "lr": 9.497824419635144e-05, "epoch": 1.7011494252873565, "percentage": 56.7, "elapsed_time": "7:24:10", "remaining_time": "5:39:08"} |
|
{"current_steps": 297, "total_steps": 522, "loss": 0.6048, "lr": 9.430935782867212e-05, "epoch": 1.706896551724138, "percentage": 56.9, "elapsed_time": "7:24:59", "remaining_time": "5:37:06"} |
|
{"current_steps": 298, "total_steps": 522, "loss": 0.6292, "lr": 9.364072679797073e-05, "epoch": 1.7126436781609196, "percentage": 57.09, "elapsed_time": "7:25:56", "remaining_time": "5:35:12"} |
|
{"current_steps": 299, "total_steps": 522, "loss": 0.6464, "lr": 9.297238110547074e-05, "epoch": 1.7183908045977012, "percentage": 57.28, "elapsed_time": "7:26:42", "remaining_time": "5:33:09"} |
|
{"current_steps": 300, "total_steps": 522, "loss": 0.6467, "lr": 9.230435073959232e-05, "epoch": 1.7241379310344827, "percentage": 57.47, "elapsed_time": "7:27:27", "remaining_time": "5:31:07"} |
|
{"current_steps": 300, "total_steps": 522, "eval_loss": 0.6469475030899048, "epoch": 1.7241379310344827, "percentage": 57.47, "elapsed_time": "7:34:16", "remaining_time": "5:36:09"} |
|
{"current_steps": 301, "total_steps": 522, "loss": 0.6268, "lr": 9.163666567460733e-05, "epoch": 1.7298850574712645, "percentage": 57.66, "elapsed_time": "7:35:02", "remaining_time": "5:34:06"} |
|
{"current_steps": 302, "total_steps": 522, "loss": 0.6367, "lr": 9.096935586929392e-05, "epoch": 1.735632183908046, "percentage": 57.85, "elapsed_time": "7:35:50", "remaining_time": "5:32:04"} |
|
{"current_steps": 303, "total_steps": 522, "loss": 0.6318, "lr": 9.030245126559262e-05, "epoch": 1.7413793103448276, "percentage": 58.05, "elapsed_time": "7:36:38", "remaining_time": "5:30:02"} |
|
{"current_steps": 304, "total_steps": 522, "loss": 0.6399, "lr": 8.963598178726254e-05, "epoch": 1.7471264367816093, "percentage": 58.24, "elapsed_time": "7:37:25", "remaining_time": "5:28:01"} |
|
{"current_steps": 305, "total_steps": 522, "loss": 0.6203, "lr": 8.896997733853903e-05, "epoch": 1.7528735632183907, "percentage": 58.43, "elapsed_time": "7:38:13", "remaining_time": "5:26:00"} |
|
{"current_steps": 306, "total_steps": 522, "loss": 0.6816, "lr": 8.830446780279176e-05, "epoch": 1.7586206896551724, "percentage": 58.62, "elapsed_time": "7:39:04", "remaining_time": "5:24:03"} |
|
{"current_steps": 307, "total_steps": 522, "loss": 0.6442, "lr": 8.763948304118368e-05, "epoch": 1.764367816091954, "percentage": 58.81, "elapsed_time": "7:39:54", "remaining_time": "5:22:04"} |
|
{"current_steps": 308, "total_steps": 522, "loss": 0.6445, "lr": 8.697505289133145e-05, "epoch": 1.7701149425287355, "percentage": 59.0, "elapsed_time": "7:40:37", "remaining_time": "5:20:02"} |
|
{"current_steps": 309, "total_steps": 522, "loss": 0.6374, "lr": 8.631120716596641e-05, "epoch": 1.7758620689655173, "percentage": 59.2, "elapsed_time": "7:41:28", "remaining_time": "5:18:06"} |
|
{"current_steps": 310, "total_steps": 522, "loss": 0.6146, "lr": 8.564797565159714e-05, "epoch": 1.7816091954022988, "percentage": 59.39, "elapsed_time": "7:42:17", "remaining_time": "5:16:09"} |
|
{"current_steps": 310, "total_steps": 522, "eval_loss": 0.6459708213806152, "epoch": 1.7816091954022988, "percentage": 59.39, "elapsed_time": "7:49:03", "remaining_time": "5:20:46"} |
|
{"current_steps": 311, "total_steps": 522, "loss": 0.6679, "lr": 8.498538810717267e-05, "epoch": 1.7873563218390804, "percentage": 59.58, "elapsed_time": "7:49:52", "remaining_time": "5:18:47"} |
|
{"current_steps": 312, "total_steps": 522, "loss": 0.642, "lr": 8.432347426274739e-05, "epoch": 1.793103448275862, "percentage": 59.77, "elapsed_time": "7:50:41", "remaining_time": "5:16:48"} |
|
{"current_steps": 313, "total_steps": 522, "loss": 0.6354, "lr": 8.366226381814697e-05, "epoch": 1.7988505747126435, "percentage": 59.96, "elapsed_time": "7:51:27", "remaining_time": "5:14:48"} |
|
{"current_steps": 314, "total_steps": 522, "loss": 0.6397, "lr": 8.300178644163594e-05, "epoch": 1.8045977011494254, "percentage": 60.15, "elapsed_time": "7:52:18", "remaining_time": "5:12:51"} |
|
{"current_steps": 315, "total_steps": 522, "loss": 0.6474, "lr": 8.234207176858614e-05, "epoch": 1.8103448275862069, "percentage": 60.34, "elapsed_time": "7:53:10", "remaining_time": "5:10:56"} |
|
{"current_steps": 316, "total_steps": 522, "loss": 0.6459, "lr": 8.16831494001474e-05, "epoch": 1.8160919540229885, "percentage": 60.54, "elapsed_time": "7:53:59", "remaining_time": "5:08:59"} |
|
{"current_steps": 317, "total_steps": 522, "loss": 0.6114, "lr": 8.102504890191892e-05, "epoch": 1.8218390804597702, "percentage": 60.73, "elapsed_time": "7:54:57", "remaining_time": "5:07:09"} |
|
{"current_steps": 318, "total_steps": 522, "loss": 0.6602, "lr": 8.036779980262311e-05, "epoch": 1.8275862068965516, "percentage": 60.92, "elapsed_time": "7:55:45", "remaining_time": "5:05:12"} |
|
{"current_steps": 319, "total_steps": 522, "loss": 0.6182, "lr": 7.971143159278026e-05, "epoch": 1.8333333333333335, "percentage": 61.11, "elapsed_time": "7:56:34", "remaining_time": "5:03:16"} |
|
{"current_steps": 320, "total_steps": 522, "loss": 0.6386, "lr": 7.905597372338558e-05, "epoch": 1.839080459770115, "percentage": 61.3, "elapsed_time": "7:57:28", "remaining_time": "5:01:24"} |
|
{"current_steps": 320, "total_steps": 522, "eval_loss": 0.6449984908103943, "epoch": 1.839080459770115, "percentage": 61.3, "elapsed_time": "8:04:14", "remaining_time": "5:05:40"} |
|
{"current_steps": 321, "total_steps": 522, "loss": 0.6522, "lr": 7.840145560458756e-05, "epoch": 1.8448275862068966, "percentage": 61.49, "elapsed_time": "8:05:04", "remaining_time": "5:03:44"} |
|
{"current_steps": 322, "total_steps": 522, "loss": 0.6401, "lr": 7.774790660436858e-05, "epoch": 1.8505747126436782, "percentage": 61.69, "elapsed_time": "8:05:55", "remaining_time": "5:01:49"} |
|
{"current_steps": 323, "total_steps": 522, "loss": 0.6315, "lr": 7.709535604722684e-05, "epoch": 1.8563218390804597, "percentage": 61.88, "elapsed_time": "8:06:56", "remaining_time": "5:00:00"} |
|
{"current_steps": 324, "total_steps": 522, "loss": 0.6559, "lr": 7.644383321286094e-05, "epoch": 1.8620689655172413, "percentage": 62.07, "elapsed_time": "8:07:45", "remaining_time": "4:58:04"} |
|
{"current_steps": 325, "total_steps": 522, "loss": 0.6297, "lr": 7.579336733485584e-05, "epoch": 1.867816091954023, "percentage": 62.26, "elapsed_time": "8:08:35", "remaining_time": "4:56:09"} |
|
{"current_steps": 326, "total_steps": 522, "loss": 0.6155, "lr": 7.514398759937135e-05, "epoch": 1.8735632183908046, "percentage": 62.45, "elapsed_time": "8:09:26", "remaining_time": "4:54:16"} |
|
{"current_steps": 327, "total_steps": 522, "loss": 0.6551, "lr": 7.449572314383237e-05, "epoch": 1.8793103448275863, "percentage": 62.64, "elapsed_time": "8:10:19", "remaining_time": "4:52:23"} |
|
{"current_steps": 328, "total_steps": 522, "loss": 0.6312, "lr": 7.384860305562172e-05, "epoch": 1.8850574712643677, "percentage": 62.84, "elapsed_time": "8:11:13", "remaining_time": "4:50:32"} |
|
{"current_steps": 329, "total_steps": 522, "loss": 0.66, "lr": 7.320265637077473e-05, "epoch": 1.8908045977011494, "percentage": 63.03, "elapsed_time": "8:12:05", "remaining_time": "4:48:40"} |
|
{"current_steps": 330, "total_steps": 522, "loss": 0.6456, "lr": 7.255791207267679e-05, "epoch": 1.896551724137931, "percentage": 63.22, "elapsed_time": "8:12:53", "remaining_time": "4:46:46"} |
|
{"current_steps": 330, "total_steps": 522, "eval_loss": 0.6442980766296387, "epoch": 1.896551724137931, "percentage": 63.22, "elapsed_time": "8:19:38", "remaining_time": "4:50:41"} |
|
{"current_steps": 331, "total_steps": 522, "loss": 0.6398, "lr": 7.191439909076243e-05, "epoch": 1.9022988505747125, "percentage": 63.41, "elapsed_time": "8:20:28", "remaining_time": "4:48:47"} |
|
{"current_steps": 332, "total_steps": 522, "loss": 0.6614, "lr": 7.127214629921765e-05, "epoch": 1.9080459770114944, "percentage": 63.6, "elapsed_time": "8:21:15", "remaining_time": "4:46:51"} |
|
{"current_steps": 333, "total_steps": 522, "loss": 0.6294, "lr": 7.0631182515684e-05, "epoch": 1.9137931034482758, "percentage": 63.79, "elapsed_time": "8:22:06", "remaining_time": "4:44:58"} |
|
{"current_steps": 334, "total_steps": 522, "loss": 0.6237, "lr": 6.999153649996595e-05, "epoch": 1.9195402298850575, "percentage": 63.98, "elapsed_time": "8:23:00", "remaining_time": "4:43:07"} |
|
{"current_steps": 335, "total_steps": 522, "loss": 0.6051, "lr": 6.935323695274002e-05, "epoch": 1.9252873563218391, "percentage": 64.18, "elapsed_time": "8:23:48", "remaining_time": "4:41:13"} |
|
{"current_steps": 336, "total_steps": 522, "loss": 0.6548, "lr": 6.871631251426728e-05, "epoch": 1.9310344827586206, "percentage": 64.37, "elapsed_time": "8:24:40", "remaining_time": "4:39:22"} |
|
{"current_steps": 337, "total_steps": 522, "loss": 0.6136, "lr": 6.808079176310827e-05, "epoch": 1.9367816091954024, "percentage": 64.56, "elapsed_time": "8:25:31", "remaining_time": "4:37:31"} |
|
{"current_steps": 338, "total_steps": 522, "loss": 0.6668, "lr": 6.744670321484043e-05, "epoch": 1.9425287356321839, "percentage": 64.75, "elapsed_time": "8:26:19", "remaining_time": "4:35:37"} |
|
{"current_steps": 339, "total_steps": 522, "loss": 0.6427, "lr": 6.681407532077895e-05, "epoch": 1.9482758620689655, "percentage": 64.94, "elapsed_time": "8:27:02", "remaining_time": "4:33:42"} |
|
{"current_steps": 340, "total_steps": 522, "loss": 0.6402, "lr": 6.618293646669986e-05, "epoch": 1.9540229885057472, "percentage": 65.13, "elapsed_time": "8:27:55", "remaining_time": "4:31:53"} |
|
{"current_steps": 340, "total_steps": 522, "eval_loss": 0.6436823606491089, "epoch": 1.9540229885057472, "percentage": 65.13, "elapsed_time": "8:34:48", "remaining_time": "4:35:34"} |
|
{"current_steps": 341, "total_steps": 522, "loss": 0.6362, "lr": 6.555331497156672e-05, "epoch": 1.9597701149425286, "percentage": 65.33, "elapsed_time": "8:35:44", "remaining_time": "4:33:45"} |
|
{"current_steps": 342, "total_steps": 522, "loss": 0.6454, "lr": 6.492523908625959e-05, "epoch": 1.9655172413793105, "percentage": 65.52, "elapsed_time": "8:36:31", "remaining_time": "4:31:51"} |
|
{"current_steps": 343, "total_steps": 522, "loss": 0.6587, "lr": 6.42987369923077e-05, "epoch": 1.971264367816092, "percentage": 65.71, "elapsed_time": "8:37:22", "remaining_time": "4:29:59"} |
|
{"current_steps": 344, "total_steps": 522, "loss": 0.6369, "lr": 6.367383680062478e-05, "epoch": 1.9770114942528736, "percentage": 65.9, "elapsed_time": "8:38:10", "remaining_time": "4:28:07"} |
|
{"current_steps": 345, "total_steps": 522, "loss": 0.6382, "lr": 6.30505665502479e-05, "epoch": 1.9827586206896552, "percentage": 66.09, "elapsed_time": "8:38:56", "remaining_time": "4:26:14"} |
|
{"current_steps": 346, "total_steps": 522, "loss": 0.6238, "lr": 6.242895420707917e-05, "epoch": 1.9885057471264367, "percentage": 66.28, "elapsed_time": "8:39:45", "remaining_time": "4:24:23"} |
|
{"current_steps": 347, "total_steps": 522, "loss": 0.632, "lr": 6.180902766263113e-05, "epoch": 1.9942528735632183, "percentage": 66.48, "elapsed_time": "8:40:37", "remaining_time": "4:22:33"} |
|
{"current_steps": 348, "total_steps": 522, "loss": 0.6078, "lr": 6.119081473277501e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "8:41:24", "remaining_time": "4:20:42"} |
|
{"current_steps": 349, "total_steps": 522, "loss": 0.6331, "lr": 6.057434315649304e-05, "epoch": 2.0057471264367814, "percentage": 66.86, "elapsed_time": "8:42:13", "remaining_time": "4:18:52"} |
|
{"current_steps": 350, "total_steps": 522, "loss": 0.6455, "lr": 5.99596405946333e-05, "epoch": 2.0114942528735633, "percentage": 67.05, "elapsed_time": "8:43:05", "remaining_time": "4:17:03"} |
|
{"current_steps": 350, "total_steps": 522, "eval_loss": 0.6433547139167786, "epoch": 2.0114942528735633, "percentage": 67.05, "elapsed_time": "8:49:54", "remaining_time": "4:20:24"} |
|
{"current_steps": 351, "total_steps": 522, "loss": 0.6473, "lr": 5.9346734628669065e-05, "epoch": 2.0172413793103448, "percentage": 67.24, "elapsed_time": "8:50:46", "remaining_time": "4:18:35"} |
|
{"current_steps": 352, "total_steps": 522, "loss": 0.6335, "lr": 5.873565275946088e-05, "epoch": 2.0229885057471266, "percentage": 67.43, "elapsed_time": "8:51:38", "remaining_time": "4:16:45"} |
|
{"current_steps": 353, "total_steps": 522, "loss": 0.5969, "lr": 5.8126422406022885e-05, "epoch": 2.028735632183908, "percentage": 67.62, "elapsed_time": "8:52:22", "remaining_time": "4:14:52"} |
|
{"current_steps": 354, "total_steps": 522, "loss": 0.5919, "lr": 5.7519070904292247e-05, "epoch": 2.0344827586206895, "percentage": 67.82, "elapsed_time": "8:53:11", "remaining_time": "4:13:02"} |
|
{"current_steps": 355, "total_steps": 522, "loss": 0.5909, "lr": 5.691362550590297e-05, "epoch": 2.0402298850574714, "percentage": 68.01, "elapsed_time": "8:54:00", "remaining_time": "4:11:12"} |
|
{"current_steps": 356, "total_steps": 522, "loss": 0.5959, "lr": 5.631011337696271e-05, "epoch": 2.045977011494253, "percentage": 68.2, "elapsed_time": "8:54:51", "remaining_time": "4:09:24"} |
|
{"current_steps": 357, "total_steps": 522, "loss": 0.6216, "lr": 5.570856159683418e-05, "epoch": 2.0517241379310347, "percentage": 68.39, "elapsed_time": "8:55:37", "remaining_time": "4:07:33"} |
|
{"current_steps": 358, "total_steps": 522, "loss": 0.6172, "lr": 5.510899715691984e-05, "epoch": 2.057471264367816, "percentage": 68.58, "elapsed_time": "8:56:23", "remaining_time": "4:05:43"} |
|
{"current_steps": 359, "total_steps": 522, "loss": 0.5931, "lr": 5.451144695945116e-05, "epoch": 2.0632183908045976, "percentage": 68.77, "elapsed_time": "8:57:09", "remaining_time": "4:03:53"} |
|
{"current_steps": 360, "total_steps": 522, "loss": 0.5888, "lr": 5.3915937816281095e-05, "epoch": 2.0689655172413794, "percentage": 68.97, "elapsed_time": "8:58:00", "remaining_time": "4:02:06"} |
|
{"current_steps": 360, "total_steps": 522, "eval_loss": 0.643742024898529, "epoch": 2.0689655172413794, "percentage": 68.97, "elapsed_time": "9:04:44", "remaining_time": "4:05:08"} |
|
{"current_steps": 361, "total_steps": 522, "loss": 0.6093, "lr": 5.3322496447681414e-05, "epoch": 2.074712643678161, "percentage": 69.16, "elapsed_time": "9:05:30", "remaining_time": "4:03:17"} |
|
{"current_steps": 362, "total_steps": 522, "loss": 0.6247, "lr": 5.273114948114346e-05, "epoch": 2.0804597701149423, "percentage": 69.35, "elapsed_time": "9:06:23", "remaining_time": "4:01:29"} |
|
{"current_steps": 363, "total_steps": 522, "loss": 0.6274, "lr": 5.214192345018374e-05, "epoch": 2.086206896551724, "percentage": 69.54, "elapsed_time": "9:07:13", "remaining_time": "3:59:41"} |
|
{"current_steps": 364, "total_steps": 522, "loss": 0.6243, "lr": 5.1554844793153e-05, "epoch": 2.0919540229885056, "percentage": 69.73, "elapsed_time": "9:08:01", "remaining_time": "3:57:52"} |
|
{"current_steps": 365, "total_steps": 522, "loss": 0.6149, "lr": 5.096993985205023e-05, "epoch": 2.0977011494252875, "percentage": 69.92, "elapsed_time": "9:08:48", "remaining_time": "3:56:03"} |
|
{"current_steps": 366, "total_steps": 522, "loss": 0.635, "lr": 5.0387234871340486e-05, "epoch": 2.103448275862069, "percentage": 70.11, "elapsed_time": "9:09:36", "remaining_time": "3:54:15"} |
|
{"current_steps": 367, "total_steps": 522, "loss": 0.6544, "lr": 4.980675599677757e-05, "epoch": 2.1091954022988504, "percentage": 70.31, "elapsed_time": "9:10:23", "remaining_time": "3:52:27"} |
|
{"current_steps": 368, "total_steps": 522, "loss": 0.6144, "lr": 4.9228529274230695e-05, "epoch": 2.1149425287356323, "percentage": 70.5, "elapsed_time": "9:11:08", "remaining_time": "3:50:38"} |
|
{"current_steps": 369, "total_steps": 522, "loss": 0.6217, "lr": 4.865258064851579e-05, "epoch": 2.1206896551724137, "percentage": 70.69, "elapsed_time": "9:11:56", "remaining_time": "3:48:51"} |
|
{"current_steps": 370, "total_steps": 522, "loss": 0.6267, "lr": 4.807893596223152e-05, "epoch": 2.1264367816091956, "percentage": 70.88, "elapsed_time": "9:12:46", "remaining_time": "3:47:04"} |
|
{"current_steps": 370, "total_steps": 522, "eval_loss": 0.6434890031814575, "epoch": 2.1264367816091956, "percentage": 70.88, "elapsed_time": "9:19:30", "remaining_time": "3:49:51"} |
|
{"current_steps": 371, "total_steps": 522, "loss": 0.6122, "lr": 4.75076209545996e-05, "epoch": 2.132183908045977, "percentage": 71.07, "elapsed_time": "9:20:19", "remaining_time": "3:48:03"} |
|
{"current_steps": 372, "total_steps": 522, "loss": 0.6339, "lr": 4.693866126030995e-05, "epoch": 2.1379310344827585, "percentage": 71.26, "elapsed_time": "9:21:09", "remaining_time": "3:46:16"} |
|
{"current_steps": 373, "total_steps": 522, "loss": 0.6392, "lr": 4.637208240837042e-05, "epoch": 2.1436781609195403, "percentage": 71.46, "elapsed_time": "9:22:03", "remaining_time": "3:44:31"} |
|
{"current_steps": 374, "total_steps": 522, "loss": 0.6207, "lr": 4.5807909820961494e-05, "epoch": 2.1494252873563218, "percentage": 71.65, "elapsed_time": "9:22:55", "remaining_time": "3:42:45"} |
|
{"current_steps": 375, "total_steps": 522, "loss": 0.6148, "lr": 4.5246168812295286e-05, "epoch": 2.1551724137931036, "percentage": 71.84, "elapsed_time": "9:23:43", "remaining_time": "3:40:58"} |
|
{"current_steps": 376, "total_steps": 522, "loss": 0.6306, "lr": 4.468688458748006e-05, "epoch": 2.160919540229885, "percentage": 72.03, "elapsed_time": "9:24:32", "remaining_time": "3:39:12"} |
|
{"current_steps": 377, "total_steps": 522, "loss": 0.606, "lr": 4.413008224138897e-05, "epoch": 2.1666666666666665, "percentage": 72.22, "elapsed_time": "9:25:19", "remaining_time": "3:37:26"} |
|
{"current_steps": 378, "total_steps": 522, "loss": 0.6007, "lr": 4.357578675753432e-05, "epoch": 2.1724137931034484, "percentage": 72.41, "elapsed_time": "9:26:10", "remaining_time": "3:35:41"} |
|
{"current_steps": 379, "total_steps": 522, "loss": 0.5884, "lr": 4.302402300694636e-05, "epoch": 2.17816091954023, "percentage": 72.61, "elapsed_time": "9:27:01", "remaining_time": "3:33:56"} |
|
{"current_steps": 380, "total_steps": 522, "loss": 0.6292, "lr": 4.247481574705744e-05, "epoch": 2.1839080459770113, "percentage": 72.8, "elapsed_time": "9:27:51", "remaining_time": "3:32:12"} |
|
{"current_steps": 380, "total_steps": 522, "eval_loss": 0.6433520913124084, "epoch": 2.1839080459770113, "percentage": 72.8, "elapsed_time": "9:34:36", "remaining_time": "3:34:43"} |
|
{"current_steps": 381, "total_steps": 522, "loss": 0.6103, "lr": 4.1928189620591116e-05, "epoch": 2.189655172413793, "percentage": 72.99, "elapsed_time": "9:35:19", "remaining_time": "3:32:54"} |
|
{"current_steps": 382, "total_steps": 522, "loss": 0.5852, "lr": 4.138416915445655e-05, "epoch": 2.1954022988505746, "percentage": 73.18, "elapsed_time": "9:36:12", "remaining_time": "3:31:10"} |
|
{"current_steps": 383, "total_steps": 522, "loss": 0.6467, "lr": 4.084277875864776e-05, "epoch": 2.2011494252873565, "percentage": 73.37, "elapsed_time": "9:36:59", "remaining_time": "3:29:24"} |
|
{"current_steps": 384, "total_steps": 522, "loss": 0.6112, "lr": 4.030404272514864e-05, "epoch": 2.206896551724138, "percentage": 73.56, "elapsed_time": "9:37:49", "remaining_time": "3:27:39"} |
|
{"current_steps": 385, "total_steps": 522, "loss": 0.5822, "lr": 3.9767985226842696e-05, "epoch": 2.2126436781609193, "percentage": 73.75, "elapsed_time": "9:38:37", "remaining_time": "3:25:54"} |
|
{"current_steps": 386, "total_steps": 522, "loss": 0.6137, "lr": 3.923463031642872e-05, "epoch": 2.218390804597701, "percentage": 73.95, "elapsed_time": "9:39:25", "remaining_time": "3:24:09"} |
|
{"current_steps": 387, "total_steps": 522, "loss": 0.602, "lr": 3.870400192534128e-05, "epoch": 2.2241379310344827, "percentage": 74.14, "elapsed_time": "9:40:12", "remaining_time": "3:22:23"} |
|
{"current_steps": 388, "total_steps": 522, "loss": 0.6215, "lr": 3.81761238626771e-05, "epoch": 2.2298850574712645, "percentage": 74.33, "elapsed_time": "9:41:01", "remaining_time": "3:20:39"} |
|
{"current_steps": 389, "total_steps": 522, "loss": 0.6002, "lr": 3.7651019814126654e-05, "epoch": 2.235632183908046, "percentage": 74.52, "elapsed_time": "9:41:52", "remaining_time": "3:18:56"} |
|
{"current_steps": 390, "total_steps": 522, "loss": 0.6058, "lr": 3.7128713340911535e-05, "epoch": 2.2413793103448274, "percentage": 74.71, "elapsed_time": "9:42:41", "remaining_time": "3:17:13"} |
|
{"current_steps": 390, "total_steps": 522, "eval_loss": 0.6431533098220825, "epoch": 2.2413793103448274, "percentage": 74.71, "elapsed_time": "9:49:41", "remaining_time": "3:19:35"} |
|
{"current_steps": 391, "total_steps": 522, "loss": 0.643, "lr": 3.660922787872706e-05, "epoch": 2.2471264367816093, "percentage": 74.9, "elapsed_time": "9:50:32", "remaining_time": "3:17:51"} |
|
{"current_steps": 392, "total_steps": 522, "loss": 0.5931, "lr": 3.609258673669097e-05, "epoch": 2.2528735632183907, "percentage": 75.1, "elapsed_time": "9:51:28", "remaining_time": "3:16:09"} |
|
{"current_steps": 393, "total_steps": 522, "loss": 0.5795, "lr": 3.557881309629729e-05, "epoch": 2.2586206896551726, "percentage": 75.29, "elapsed_time": "9:52:17", "remaining_time": "3:14:24"} |
|
{"current_steps": 394, "total_steps": 522, "loss": 0.6173, "lr": 3.5067930010376484e-05, "epoch": 2.264367816091954, "percentage": 75.48, "elapsed_time": "9:53:04", "remaining_time": "3:12:40"} |
|
{"current_steps": 395, "total_steps": 522, "loss": 0.6238, "lr": 3.455996040206076e-05, "epoch": 2.2701149425287355, "percentage": 75.67, "elapsed_time": "9:53:59", "remaining_time": "3:10:58"} |
|
{"current_steps": 396, "total_steps": 522, "loss": 0.6264, "lr": 3.4054927063755796e-05, "epoch": 2.2758620689655173, "percentage": 75.86, "elapsed_time": "9:54:55", "remaining_time": "3:09:17"} |
|
{"current_steps": 397, "total_steps": 522, "loss": 0.6269, "lr": 3.355285265611784e-05, "epoch": 2.281609195402299, "percentage": 76.05, "elapsed_time": "9:55:46", "remaining_time": "3:07:35"} |
|
{"current_steps": 398, "total_steps": 522, "loss": 0.6043, "lr": 3.305375970703711e-05, "epoch": 2.2873563218390807, "percentage": 76.25, "elapsed_time": "9:56:36", "remaining_time": "3:05:52"} |
|
{"current_steps": 399, "total_steps": 522, "loss": 0.6416, "lr": 3.2557670610626925e-05, "epoch": 2.293103448275862, "percentage": 76.44, "elapsed_time": "9:57:27", "remaining_time": "3:04:10"} |
|
{"current_steps": 400, "total_steps": 522, "loss": 0.6221, "lr": 3.206460762621873e-05, "epoch": 2.2988505747126435, "percentage": 76.63, "elapsed_time": "9:58:20", "remaining_time": "3:02:29"} |
|
{"current_steps": 400, "total_steps": 522, "eval_loss": 0.6427375078201294, "epoch": 2.2988505747126435, "percentage": 76.63, "elapsed_time": "10:05:06", "remaining_time": "3:04:33"} |
|
{"current_steps": 401, "total_steps": 522, "loss": 0.599, "lr": 3.157459287736362e-05, "epoch": 2.3045977011494254, "percentage": 76.82, "elapsed_time": "10:05:54", "remaining_time": "3:02:49"} |
|
{"current_steps": 402, "total_steps": 522, "loss": 0.6243, "lr": 3.108764835083938e-05, "epoch": 2.310344827586207, "percentage": 77.01, "elapsed_time": "10:06:45", "remaining_time": "3:01:07"} |
|
{"current_steps": 403, "total_steps": 522, "loss": 0.615, "lr": 3.0603795895664124e-05, "epoch": 2.3160919540229887, "percentage": 77.2, "elapsed_time": "10:07:36", "remaining_time": "2:59:25"} |
|
{"current_steps": 404, "total_steps": 522, "loss": 0.5968, "lr": 3.0123057222115836e-05, "epoch": 2.32183908045977, "percentage": 77.39, "elapsed_time": "10:08:33", "remaining_time": "2:57:44"} |
|
{"current_steps": 405, "total_steps": 522, "loss": 0.6192, "lr": 2.964545390075841e-05, "epoch": 2.3275862068965516, "percentage": 77.59, "elapsed_time": "10:09:25", "remaining_time": "2:56:03"} |
|
{"current_steps": 406, "total_steps": 522, "loss": 0.6237, "lr": 2.9171007361473514e-05, "epoch": 2.3333333333333335, "percentage": 77.78, "elapsed_time": "10:10:16", "remaining_time": "2:54:21"} |
|
{"current_steps": 407, "total_steps": 522, "loss": 0.6123, "lr": 2.8699738892499328e-05, "epoch": 2.339080459770115, "percentage": 77.97, "elapsed_time": "10:11:01", "remaining_time": "2:52:38"} |
|
{"current_steps": 408, "total_steps": 522, "loss": 0.6123, "lr": 2.8231669639475067e-05, "epoch": 2.344827586206897, "percentage": 78.16, "elapsed_time": "10:11:46", "remaining_time": "2:50:56"} |
|
{"current_steps": 409, "total_steps": 522, "loss": 0.6251, "lr": 2.776682060449247e-05, "epoch": 2.3505747126436782, "percentage": 78.35, "elapsed_time": "10:12:35", "remaining_time": "2:49:14"} |
|
{"current_steps": 410, "total_steps": 522, "loss": 0.6254, "lr": 2.7305212645153212e-05, "epoch": 2.3563218390804597, "percentage": 78.54, "elapsed_time": "10:13:29", "remaining_time": "2:47:35"} |
|
{"current_steps": 410, "total_steps": 522, "eval_loss": 0.6428195238113403, "epoch": 2.3563218390804597, "percentage": 78.54, "elapsed_time": "10:20:14", "remaining_time": "2:49:25"} |
|
{"current_steps": 411, "total_steps": 522, "loss": 0.6216, "lr": 2.6846866473633125e-05, "epoch": 2.3620689655172415, "percentage": 78.74, "elapsed_time": "10:21:00", "remaining_time": "2:47:42"} |
|
{"current_steps": 412, "total_steps": 522, "loss": 0.6052, "lr": 2.6391802655752853e-05, "epoch": 2.367816091954023, "percentage": 78.93, "elapsed_time": "10:21:50", "remaining_time": "2:46:01"} |
|
{"current_steps": 413, "total_steps": 522, "loss": 0.6007, "lr": 2.594004161005511e-05, "epoch": 2.3735632183908044, "percentage": 79.12, "elapsed_time": "10:22:42", "remaining_time": "2:44:20"} |
|
{"current_steps": 414, "total_steps": 522, "loss": 0.5876, "lr": 2.549160360688838e-05, "epoch": 2.3793103448275863, "percentage": 79.31, "elapsed_time": "10:23:31", "remaining_time": "2:42:39"} |
|
{"current_steps": 415, "total_steps": 522, "loss": 0.6183, "lr": 2.50465087674976e-05, "epoch": 2.3850574712643677, "percentage": 79.5, "elapsed_time": "10:24:27", "remaining_time": "2:41:00"} |
|
{"current_steps": 416, "total_steps": 522, "loss": 0.613, "lr": 2.4604777063121033e-05, "epoch": 2.3908045977011496, "percentage": 79.69, "elapsed_time": "10:25:21", "remaining_time": "2:39:20"} |
|
{"current_steps": 417, "total_steps": 522, "loss": 0.6443, "lr": 2.4166428314094514e-05, "epoch": 2.396551724137931, "percentage": 79.89, "elapsed_time": "10:26:08", "remaining_time": "2:37:39"} |
|
{"current_steps": 418, "total_steps": 522, "loss": 0.6062, "lr": 2.3731482188961818e-05, "epoch": 2.4022988505747125, "percentage": 80.08, "elapsed_time": "10:26:59", "remaining_time": "2:35:59"} |
|
{"current_steps": 419, "total_steps": 522, "loss": 0.6099, "lr": 2.32999582035923e-05, "epoch": 2.4080459770114944, "percentage": 80.27, "elapsed_time": "10:27:46", "remaining_time": "2:34:19"} |
|
{"current_steps": 420, "total_steps": 522, "loss": 0.6178, "lr": 2.287187572030516e-05, "epoch": 2.413793103448276, "percentage": 80.46, "elapsed_time": "10:28:40", "remaining_time": "2:32:40"} |
|
{"current_steps": 420, "total_steps": 522, "eval_loss": 0.6422638297080994, "epoch": 2.413793103448276, "percentage": 80.46, "elapsed_time": "10:35:24", "remaining_time": "2:34:18"} |
|
{"current_steps": 421, "total_steps": 522, "loss": 0.6166, "lr": 2.244725394700079e-05, "epoch": 2.4195402298850572, "percentage": 80.65, "elapsed_time": "10:36:17", "remaining_time": "2:32:38"} |
|
{"current_steps": 422, "total_steps": 522, "loss": 0.6195, "lr": 2.202611193629869e-05, "epoch": 2.425287356321839, "percentage": 80.84, "elapsed_time": "10:37:09", "remaining_time": "2:30:59"} |
|
{"current_steps": 423, "total_steps": 522, "loss": 0.6157, "lr": 2.160846858468285e-05, "epoch": 2.4310344827586206, "percentage": 81.03, "elapsed_time": "10:37:58", "remaining_time": "2:29:18"} |
|
{"current_steps": 424, "total_steps": 522, "loss": 0.6212, "lr": 2.1194342631653607e-05, "epoch": 2.4367816091954024, "percentage": 81.23, "elapsed_time": "10:38:47", "remaining_time": "2:27:38"} |
|
{"current_steps": 425, "total_steps": 522, "loss": 0.6095, "lr": 2.0783752658887066e-05, "epoch": 2.442528735632184, "percentage": 81.42, "elapsed_time": "10:39:33", "remaining_time": "2:25:58"} |
|
{"current_steps": 426, "total_steps": 522, "loss": 0.606, "lr": 2.0376717089401164e-05, "epoch": 2.4482758620689653, "percentage": 81.61, "elapsed_time": "10:40:22", "remaining_time": "2:24:18"} |
|
{"current_steps": 427, "total_steps": 522, "loss": 0.6109, "lr": 1.9973254186729086e-05, "epoch": 2.454022988505747, "percentage": 81.8, "elapsed_time": "10:41:12", "remaining_time": "2:22:39"} |
|
{"current_steps": 428, "total_steps": 522, "loss": 0.5896, "lr": 1.9573382054099786e-05, "epoch": 2.4597701149425286, "percentage": 81.99, "elapsed_time": "10:42:02", "remaining_time": "2:21:00"} |
|
{"current_steps": 429, "total_steps": 522, "loss": 0.6022, "lr": 1.9177118633625814e-05, "epoch": 2.4655172413793105, "percentage": 82.18, "elapsed_time": "10:42:57", "remaining_time": "2:19:22"} |
|
{"current_steps": 430, "total_steps": 522, "loss": 0.6161, "lr": 1.8784481705498015e-05, "epoch": 2.471264367816092, "percentage": 82.38, "elapsed_time": "10:43:42", "remaining_time": "2:17:43"} |
|
{"current_steps": 430, "total_steps": 522, "eval_loss": 0.642048180103302, "epoch": 2.471264367816092, "percentage": 82.38, "elapsed_time": "10:50:28", "remaining_time": "2:19:10"} |
|
{"current_steps": 431, "total_steps": 522, "loss": 0.581, "lr": 1.8395488887188005e-05, "epoch": 2.4770114942528734, "percentage": 82.57, "elapsed_time": "10:51:20", "remaining_time": "2:17:31"} |
|
{"current_steps": 432, "total_steps": 522, "loss": 0.6149, "lr": 1.8010157632657543e-05, "epoch": 2.4827586206896552, "percentage": 82.76, "elapsed_time": "10:52:14", "remaining_time": "2:15:53"} |
|
{"current_steps": 433, "total_steps": 522, "loss": 0.6264, "lr": 1.762850523157532e-05, "epoch": 2.4885057471264367, "percentage": 82.95, "elapsed_time": "10:53:06", "remaining_time": "2:14:14"} |
|
{"current_steps": 434, "total_steps": 522, "loss": 0.6055, "lr": 1.7250548808541322e-05, "epoch": 2.4942528735632186, "percentage": 83.14, "elapsed_time": "10:53:59", "remaining_time": "2:12:36"} |
|
{"current_steps": 435, "total_steps": 522, "loss": 0.5907, "lr": 1.687630532231833e-05, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "10:54:45", "remaining_time": "2:10:57"} |
|
{"current_steps": 436, "total_steps": 522, "loss": 0.6189, "lr": 1.6505791565071138e-05, "epoch": 2.5057471264367814, "percentage": 83.52, "elapsed_time": "10:55:32", "remaining_time": "2:09:18"} |
|
{"current_steps": 437, "total_steps": 522, "loss": 0.6084, "lr": 1.613902416161288e-05, "epoch": 2.5114942528735633, "percentage": 83.72, "elapsed_time": "10:56:22", "remaining_time": "2:07:40"} |
|
{"current_steps": 438, "total_steps": 522, "loss": 0.624, "lr": 1.5776019568659338e-05, "epoch": 2.5172413793103448, "percentage": 83.91, "elapsed_time": "10:57:08", "remaining_time": "2:06:01"} |
|
{"current_steps": 439, "total_steps": 522, "loss": 0.6374, "lr": 1.5416794074090258e-05, "epoch": 2.5229885057471266, "percentage": 84.1, "elapsed_time": "10:57:57", "remaining_time": "2:04:23"} |
|
{"current_steps": 440, "total_steps": 522, "loss": 0.634, "lr": 1.5061363796218785e-05, "epoch": 2.528735632183908, "percentage": 84.29, "elapsed_time": "10:58:41", "remaining_time": "2:02:45"} |
|
{"current_steps": 440, "total_steps": 522, "eval_loss": 0.6419377326965332, "epoch": 2.528735632183908, "percentage": 84.29, "elapsed_time": "11:05:38", "remaining_time": "2:04:03"} |
|
{"current_steps": 441, "total_steps": 522, "loss": 0.6443, "lr": 1.4709744683068039e-05, "epoch": 2.5344827586206895, "percentage": 84.48, "elapsed_time": "11:06:34", "remaining_time": "2:02:25"} |
|
{"current_steps": 442, "total_steps": 522, "loss": 0.6111, "lr": 1.4361952511655618e-05, "epoch": 2.5402298850574714, "percentage": 84.67, "elapsed_time": "11:07:21", "remaining_time": "2:00:47"} |
|
{"current_steps": 443, "total_steps": 522, "loss": 0.6007, "lr": 1.4018002887285687e-05, "epoch": 2.545977011494253, "percentage": 84.87, "elapsed_time": "11:08:08", "remaining_time": "1:59:08"} |
|
{"current_steps": 444, "total_steps": 522, "loss": 0.6083, "lr": 1.3677911242848806e-05, "epoch": 2.5517241379310347, "percentage": 85.06, "elapsed_time": "11:08:52", "remaining_time": "1:57:30"} |
|
{"current_steps": 445, "total_steps": 522, "loss": 0.6227, "lr": 1.334169283812936e-05, "epoch": 2.557471264367816, "percentage": 85.25, "elapsed_time": "11:09:43", "remaining_time": "1:55:53"} |
|
{"current_steps": 446, "total_steps": 522, "loss": 0.6212, "lr": 1.300936275912098e-05, "epoch": 2.5632183908045976, "percentage": 85.44, "elapsed_time": "11:10:32", "remaining_time": "1:54:15"} |
|
{"current_steps": 447, "total_steps": 522, "loss": 0.5915, "lr": 1.2680935917349523e-05, "epoch": 2.5689655172413794, "percentage": 85.63, "elapsed_time": "11:11:22", "remaining_time": "1:52:38"} |
|
{"current_steps": 448, "total_steps": 522, "loss": 0.5972, "lr": 1.2356427049204122e-05, "epoch": 2.574712643678161, "percentage": 85.82, "elapsed_time": "11:12:13", "remaining_time": "1:51:02"} |
|
{"current_steps": 449, "total_steps": 522, "loss": 0.6358, "lr": 1.2035850715275865e-05, "epoch": 2.5804597701149428, "percentage": 86.02, "elapsed_time": "11:13:01", "remaining_time": "1:49:25"} |
|
{"current_steps": 450, "total_steps": 522, "loss": 0.6241, "lr": 1.1719221299704497e-05, "epoch": 2.586206896551724, "percentage": 86.21, "elapsed_time": "11:13:55", "remaining_time": "1:47:49"} |
|
{"current_steps": 450, "total_steps": 522, "eval_loss": 0.641758382320404, "epoch": 2.586206896551724, "percentage": 86.21, "elapsed_time": "11:20:40", "remaining_time": "1:48:54"} |
|
{"current_steps": 451, "total_steps": 522, "loss": 0.6027, "lr": 1.1406553009533027e-05, "epoch": 2.5919540229885056, "percentage": 86.4, "elapsed_time": "11:21:27", "remaining_time": "1:47:16"} |
|
{"current_steps": 452, "total_steps": 522, "loss": 0.6226, "lr": 1.1097859874070294e-05, "epoch": 2.5977011494252875, "percentage": 86.59, "elapsed_time": "11:22:20", "remaining_time": "1:45:40"} |
|
{"current_steps": 453, "total_steps": 522, "loss": 0.6145, "lr": 1.0793155744261351e-05, "epoch": 2.603448275862069, "percentage": 86.78, "elapsed_time": "11:23:09", "remaining_time": "1:44:03"} |
|
{"current_steps": 454, "total_steps": 522, "loss": 0.6131, "lr": 1.0492454292066178e-05, "epoch": 2.609195402298851, "percentage": 86.97, "elapsed_time": "11:24:05", "remaining_time": "1:42:27"} |
|
{"current_steps": 455, "total_steps": 522, "loss": 0.6312, "lr": 1.019576900984599e-05, "epoch": 2.6149425287356323, "percentage": 87.16, "elapsed_time": "11:24:58", "remaining_time": "1:40:51"} |
|
{"current_steps": 456, "total_steps": 522, "loss": 0.6167, "lr": 9.903113209758096e-06, "epoch": 2.6206896551724137, "percentage": 87.36, "elapsed_time": "11:25:45", "remaining_time": "1:39:15"} |
|
{"current_steps": 457, "total_steps": 522, "loss": 0.5969, "lr": 9.614500023158336e-06, "epoch": 2.626436781609195, "percentage": 87.55, "elapsed_time": "11:26:39", "remaining_time": "1:37:39"} |
|
{"current_steps": 458, "total_steps": 522, "loss": 0.6324, "lr": 9.32994240001206e-06, "epoch": 2.632183908045977, "percentage": 87.74, "elapsed_time": "11:27:24", "remaining_time": "1:36:03"} |
|
{"current_steps": 459, "total_steps": 522, "loss": 0.5779, "lr": 9.049453108312966e-06, "epoch": 2.637931034482759, "percentage": 87.93, "elapsed_time": "11:28:12", "remaining_time": "1:34:27"} |
|
{"current_steps": 460, "total_steps": 522, "loss": 0.6084, "lr": 8.773044733510338e-06, "epoch": 2.6436781609195403, "percentage": 88.12, "elapsed_time": "11:29:01", "remaining_time": "1:32:52"} |
|
{"current_steps": 460, "total_steps": 522, "eval_loss": 0.6415662169456482, "epoch": 2.6436781609195403, "percentage": 88.12, "elapsed_time": "11:35:45", "remaining_time": "1:33:46"} |
|
{"current_steps": 461, "total_steps": 522, "loss": 0.5962, "lr": 8.50072967794413e-06, "epoch": 2.6494252873563218, "percentage": 88.31, "elapsed_time": "11:36:33", "remaining_time": "1:32:10"} |
|
{"current_steps": 462, "total_steps": 522, "loss": 0.6276, "lr": 8.232520160288704e-06, "epoch": 2.655172413793103, "percentage": 88.51, "elapsed_time": "11:37:20", "remaining_time": "1:30:33"} |
|
{"current_steps": 463, "total_steps": 522, "loss": 0.6047, "lr": 7.96842821500442e-06, "epoch": 2.660919540229885, "percentage": 88.7, "elapsed_time": "11:38:05", "remaining_time": "1:28:57"} |
|
{"current_steps": 464, "total_steps": 522, "loss": 0.6006, "lr": 7.708465691797717e-06, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "11:38:56", "remaining_time": "1:27:22"} |
|
{"current_steps": 465, "total_steps": 522, "loss": 0.6261, "lr": 7.452644255089425e-06, "epoch": 2.6724137931034484, "percentage": 89.08, "elapsed_time": "11:39:45", "remaining_time": "1:25:46"} |
|
{"current_steps": 466, "total_steps": 522, "loss": 0.6146, "lr": 7.20097538349136e-06, "epoch": 2.67816091954023, "percentage": 89.27, "elapsed_time": "11:40:32", "remaining_time": "1:24:11"} |
|
{"current_steps": 467, "total_steps": 522, "loss": 0.6237, "lr": 6.953470369291348e-06, "epoch": 2.6839080459770113, "percentage": 89.46, "elapsed_time": "11:41:26", "remaining_time": "1:22:36"} |
|
{"current_steps": 468, "total_steps": 522, "loss": 0.643, "lr": 6.710140317946423e-06, "epoch": 2.689655172413793, "percentage": 89.66, "elapsed_time": "11:42:13", "remaining_time": "1:21:01"} |
|
{"current_steps": 469, "total_steps": 522, "loss": 0.5764, "lr": 6.470996147584685e-06, "epoch": 2.6954022988505746, "percentage": 89.85, "elapsed_time": "11:42:55", "remaining_time": "1:19:26"} |
|
{"current_steps": 470, "total_steps": 522, "loss": 0.6264, "lr": 6.236048588515242e-06, "epoch": 2.7011494252873565, "percentage": 90.04, "elapsed_time": "11:43:46", "remaining_time": "1:17:51"} |
|
{"current_steps": 470, "total_steps": 522, "eval_loss": 0.6414589881896973, "epoch": 2.7011494252873565, "percentage": 90.04, "elapsed_time": "11:50:32", "remaining_time": "1:18:36"} |
|
{"current_steps": 471, "total_steps": 522, "loss": 0.6455, "lr": 6.0053081827469045e-06, "epoch": 2.706896551724138, "percentage": 90.23, "elapsed_time": "11:51:21", "remaining_time": "1:17:01"} |
|
{"current_steps": 472, "total_steps": 522, "loss": 0.6254, "lr": 5.778785283515053e-06, "epoch": 2.7126436781609193, "percentage": 90.42, "elapsed_time": "11:52:09", "remaining_time": "1:15:26"} |
|
{"current_steps": 473, "total_steps": 522, "loss": 0.6284, "lr": 5.556490054817132e-06, "epoch": 2.718390804597701, "percentage": 90.61, "elapsed_time": "11:53:04", "remaining_time": "1:13:52"} |
|
{"current_steps": 474, "total_steps": 522, "loss": 0.6092, "lr": 5.338432470956589e-06, "epoch": 2.7241379310344827, "percentage": 90.8, "elapsed_time": "11:53:52", "remaining_time": "1:12:17"} |
|
{"current_steps": 475, "total_steps": 522, "loss": 0.6489, "lr": 5.1246223160953845e-06, "epoch": 2.7298850574712645, "percentage": 91.0, "elapsed_time": "11:54:44", "remaining_time": "1:10:43"} |
|
{"current_steps": 476, "total_steps": 522, "loss": 0.6154, "lr": 4.91506918381488e-06, "epoch": 2.735632183908046, "percentage": 91.19, "elapsed_time": "11:55:35", "remaining_time": "1:09:09"} |
|
{"current_steps": 477, "total_steps": 522, "loss": 0.6232, "lr": 4.7097824766854756e-06, "epoch": 2.7413793103448274, "percentage": 91.38, "elapsed_time": "11:56:21", "remaining_time": "1:07:34"} |
|
{"current_steps": 478, "total_steps": 522, "loss": 0.6209, "lr": 4.508771405844636e-06, "epoch": 2.7471264367816093, "percentage": 91.57, "elapsed_time": "11:57:11", "remaining_time": "1:06:01"} |
|
{"current_steps": 479, "total_steps": 522, "loss": 0.6298, "lr": 4.312044990583675e-06, "epoch": 2.7528735632183907, "percentage": 91.76, "elapsed_time": "11:58:01", "remaining_time": "1:04:27"} |
|
{"current_steps": 480, "total_steps": 522, "loss": 0.608, "lr": 4.119612057942978e-06, "epoch": 2.7586206896551726, "percentage": 91.95, "elapsed_time": "11:58:54", "remaining_time": "1:02:54"} |
|
{"current_steps": 480, "total_steps": 522, "eval_loss": 0.6413341164588928, "epoch": 2.7586206896551726, "percentage": 91.95, "elapsed_time": "12:05:44", "remaining_time": "1:03:30"} |
|
{"current_steps": 481, "total_steps": 522, "loss": 0.6426, "lr": 3.931481242315993e-06, "epoch": 2.764367816091954, "percentage": 92.15, "elapsed_time": "12:06:38", "remaining_time": "1:01:56"} |
|
{"current_steps": 482, "total_steps": 522, "loss": 0.6126, "lr": 3.747660985061785e-06, "epoch": 2.7701149425287355, "percentage": 92.34, "elapsed_time": "12:07:27", "remaining_time": "1:00:22"} |
|
{"current_steps": 483, "total_steps": 522, "loss": 0.5786, "lr": 3.568159534126314e-06, "epoch": 2.7758620689655173, "percentage": 92.53, "elapsed_time": "12:08:19", "remaining_time": "0:58:48"} |
|
{"current_steps": 484, "total_steps": 522, "loss": 0.6341, "lr": 3.3929849436722728e-06, "epoch": 2.781609195402299, "percentage": 92.72, "elapsed_time": "12:09:16", "remaining_time": "0:57:15"} |
|
{"current_steps": 485, "total_steps": 522, "loss": 0.6062, "lr": 3.2221450737178083e-06, "epoch": 2.7873563218390807, "percentage": 92.91, "elapsed_time": "12:10:07", "remaining_time": "0:55:41"} |
|
{"current_steps": 486, "total_steps": 522, "loss": 0.5974, "lr": 3.0556475897837166e-06, "epoch": 2.793103448275862, "percentage": 93.1, "elapsed_time": "12:10:58", "remaining_time": "0:54:08"} |
|
{"current_steps": 487, "total_steps": 522, "loss": 0.6157, "lr": 2.8934999625496282e-06, "epoch": 2.7988505747126435, "percentage": 93.3, "elapsed_time": "12:11:45", "remaining_time": "0:52:35"} |
|
{"current_steps": 488, "total_steps": 522, "loss": 0.625, "lr": 2.735709467518699e-06, "epoch": 2.8045977011494254, "percentage": 93.49, "elapsed_time": "12:12:37", "remaining_time": "0:51:02"} |
|
{"current_steps": 489, "total_steps": 522, "loss": 0.5991, "lr": 2.5822831846912033e-06, "epoch": 2.810344827586207, "percentage": 93.68, "elapsed_time": "12:13:30", "remaining_time": "0:49:30"} |
|
{"current_steps": 490, "total_steps": 522, "loss": 0.6039, "lr": 2.4332279982468453e-06, "epoch": 2.8160919540229887, "percentage": 93.87, "elapsed_time": "12:14:21", "remaining_time": "0:47:57"} |
|
{"current_steps": 490, "total_steps": 522, "eval_loss": 0.6412601470947266, "epoch": 2.8160919540229887, "percentage": 93.87, "elapsed_time": "12:21:07", "remaining_time": "0:48:23"} |
|
{"current_steps": 491, "total_steps": 522, "loss": 0.5907, "lr": 2.2885505962359054e-06, "epoch": 2.82183908045977, "percentage": 94.06, "elapsed_time": "12:22:06", "remaining_time": "0:46:51"} |
|
{"current_steps": 492, "total_steps": 522, "loss": 0.615, "lr": 2.1482574702790803e-06, "epoch": 2.8275862068965516, "percentage": 94.25, "elapsed_time": "12:22:52", "remaining_time": "0:45:17"} |
|
{"current_steps": 493, "total_steps": 522, "loss": 0.6334, "lr": 2.0123549152762823e-06, "epoch": 2.8333333333333335, "percentage": 94.44, "elapsed_time": "12:23:41", "remaining_time": "0:43:44"} |
|
{"current_steps": 494, "total_steps": 522, "loss": 0.6186, "lr": 1.8808490291241432e-06, "epoch": 2.839080459770115, "percentage": 94.64, "elapsed_time": "12:24:30", "remaining_time": "0:42:11"} |
|
{"current_steps": 495, "total_steps": 522, "loss": 0.6324, "lr": 1.7537457124423895e-06, "epoch": 2.844827586206897, "percentage": 94.83, "elapsed_time": "12:25:19", "remaining_time": "0:40:39"} |
|
{"current_steps": 496, "total_steps": 522, "loss": 0.6406, "lr": 1.631050668309131e-06, "epoch": 2.8505747126436782, "percentage": 95.02, "elapsed_time": "12:26:07", "remaining_time": "0:39:06"} |
|
{"current_steps": 497, "total_steps": 522, "loss": 0.6253, "lr": 1.5127694020049432e-06, "epoch": 2.8563218390804597, "percentage": 95.21, "elapsed_time": "12:26:58", "remaining_time": "0:37:34"} |
|
{"current_steps": 498, "total_steps": 522, "loss": 0.6158, "lr": 1.3989072207658328e-06, "epoch": 2.862068965517241, "percentage": 95.4, "elapsed_time": "12:27:48", "remaining_time": "0:36:02"} |
|
{"current_steps": 499, "total_steps": 522, "loss": 0.6091, "lr": 1.2894692335451375e-06, "epoch": 2.867816091954023, "percentage": 95.59, "elapsed_time": "12:28:37", "remaining_time": "0:34:30"} |
|
{"current_steps": 500, "total_steps": 522, "loss": 0.6445, "lr": 1.1844603507842668e-06, "epoch": 2.873563218390805, "percentage": 95.79, "elapsed_time": "12:29:29", "remaining_time": "0:32:58"} |
|
{"current_steps": 500, "total_steps": 522, "eval_loss": 0.641264796257019, "epoch": 2.873563218390805, "percentage": 95.79, "elapsed_time": "12:36:14", "remaining_time": "0:33:16"} |
|
{"current_steps": 501, "total_steps": 522, "loss": 0.6061, "lr": 1.083885284192354e-06, "epoch": 2.8793103448275863, "percentage": 95.98, "elapsed_time": "12:37:04", "remaining_time": "0:31:44"} |
|
{"current_steps": 502, "total_steps": 522, "loss": 0.5868, "lr": 9.877485465349058e-07, "epoch": 2.8850574712643677, "percentage": 96.17, "elapsed_time": "12:37:54", "remaining_time": "0:30:11"} |
|
{"current_steps": 503, "total_steps": 522, "loss": 0.6219, "lr": 8.960544514312275e-07, "epoch": 2.890804597701149, "percentage": 96.36, "elapsed_time": "12:38:44", "remaining_time": "0:28:39"} |
|
{"current_steps": 504, "total_steps": 522, "loss": 0.6043, "lr": 8.088071131609587e-07, "epoch": 2.896551724137931, "percentage": 96.55, "elapsed_time": "12:39:32", "remaining_time": "0:27:07"} |
|
{"current_steps": 505, "total_steps": 522, "loss": 0.622, "lr": 7.26010446479397e-07, "epoch": 2.9022988505747125, "percentage": 96.74, "elapsed_time": "12:40:22", "remaining_time": "0:25:35"} |
|
{"current_steps": 506, "total_steps": 522, "loss": 0.5829, "lr": 6.476681664419171e-07, "epoch": 2.9080459770114944, "percentage": 96.93, "elapsed_time": "12:41:10", "remaining_time": "0:24:04"} |
|
{"current_steps": 507, "total_steps": 522, "loss": 0.6162, "lr": 5.737837882371922e-07, "epoch": 2.913793103448276, "percentage": 97.13, "elapsed_time": "12:42:00", "remaining_time": "0:22:32"} |
|
{"current_steps": 508, "total_steps": 522, "loss": 0.604, "lr": 5.043606270295654e-07, "epoch": 2.9195402298850572, "percentage": 97.32, "elapsed_time": "12:42:49", "remaining_time": "0:21:01"} |
|
{"current_steps": 509, "total_steps": 522, "loss": 0.6291, "lr": 4.3940179781019055e-07, "epoch": 2.925287356321839, "percentage": 97.51, "elapsed_time": "12:43:32", "remaining_time": "0:19:30"} |
|
{"current_steps": 510, "total_steps": 522, "loss": 0.6249, "lr": 3.789102152573665e-07, "epoch": 2.9310344827586206, "percentage": 97.7, "elapsed_time": "12:44:23", "remaining_time": "0:17:59"} |
|
{"current_steps": 510, "total_steps": 522, "eval_loss": 0.6412717700004578, "epoch": 2.9310344827586206, "percentage": 97.7, "elapsed_time": "12:51:08", "remaining_time": "0:18:08"} |
|
{"current_steps": 511, "total_steps": 522, "loss": 0.6103, "lr": 3.228885936056858e-07, "epoch": 2.9367816091954024, "percentage": 97.89, "elapsed_time": "12:51:52", "remaining_time": "0:16:36"} |
|
{"current_steps": 512, "total_steps": 522, "loss": 0.5975, "lr": 2.713394465242991e-07, "epoch": 2.942528735632184, "percentage": 98.08, "elapsed_time": "12:52:37", "remaining_time": "0:15:05"} |
|
{"current_steps": 513, "total_steps": 522, "loss": 0.6018, "lr": 2.242650870040497e-07, "epoch": 2.9482758620689653, "percentage": 98.28, "elapsed_time": "12:53:30", "remaining_time": "0:13:34"} |
|
{"current_steps": 514, "total_steps": 522, "loss": 0.5967, "lr": 1.8166762725381203e-07, "epoch": 2.954022988505747, "percentage": 98.47, "elapsed_time": "12:54:15", "remaining_time": "0:12:03"} |
|
{"current_steps": 515, "total_steps": 522, "loss": 0.6012, "lr": 1.4354897860558992e-07, "epoch": 2.9597701149425286, "percentage": 98.66, "elapsed_time": "12:55:04", "remaining_time": "0:10:32"} |
|
{"current_steps": 516, "total_steps": 522, "loss": 0.5863, "lr": 1.0991085142886271e-07, "epoch": 2.9655172413793105, "percentage": 98.85, "elapsed_time": "12:55:52", "remaining_time": "0:09:01"} |
|
{"current_steps": 517, "total_steps": 522, "loss": 0.6229, "lr": 8.075475505373575e-08, "epoch": 2.971264367816092, "percentage": 99.04, "elapsed_time": "12:56:46", "remaining_time": "0:07:30"} |
|
{"current_steps": 518, "total_steps": 522, "loss": 0.6239, "lr": 5.608199770334999e-08, "epoch": 2.9770114942528734, "percentage": 99.23, "elapsed_time": "12:57:35", "remaining_time": "0:06:00"} |
|
{"current_steps": 519, "total_steps": 522, "loss": 0.6178, "lr": 3.5893686435029e-08, "epoch": 2.9827586206896552, "percentage": 99.43, "elapsed_time": "12:58:26", "remaining_time": "0:04:29"} |
|
{"current_steps": 520, "total_steps": 522, "loss": 0.6006, "lr": 2.019072709074088e-08, "epoch": 2.9885057471264367, "percentage": 99.62, "elapsed_time": "12:59:19", "remaining_time": "0:02:59"} |
|
{"current_steps": 520, "total_steps": 522, "eval_loss": 0.6412657499313354, "epoch": 2.9885057471264367, "percentage": 99.62, "elapsed_time": "13:06:06", "remaining_time": "0:03:01"} |
|
{"current_steps": 521, "total_steps": 522, "loss": 0.6094, "lr": 8.973824256364171e-09, "epoch": 2.9942528735632186, "percentage": 99.81, "elapsed_time": "13:06:59", "remaining_time": "0:01:30"} |
|
{"current_steps": 522, "total_steps": 522, "loss": 0.6062, "lr": 2.2434812301352913e-09, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "13:07:45", "remaining_time": "0:00:00"} |
|
{"current_steps": 522, "total_steps": 522, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "13:07:48", "remaining_time": "0:00:00"} |
|
|