EFAGen-Llama-3.1-Instruct-8B / trainer_log.jsonl
codezakh's picture
Upload folder using huggingface_hub
48830f7 verified
{"current_steps": 10, "total_steps": 1431, "loss": 0.341, "learning_rate": 6.944444444444445e-06, "epoch": 0.020942408376963352, "percentage": 0.7, "elapsed_time": "0:01:27", "remaining_time": "3:26:57"}
{"current_steps": 20, "total_steps": 1431, "loss": 0.3137, "learning_rate": 1.388888888888889e-05, "epoch": 0.041884816753926704, "percentage": 1.4, "elapsed_time": "0:02:54", "remaining_time": "3:25:29"}
{"current_steps": 30, "total_steps": 1431, "loss": 0.2399, "learning_rate": 2.0833333333333336e-05, "epoch": 0.06282722513089005, "percentage": 2.1, "elapsed_time": "0:04:21", "remaining_time": "3:23:32"}
{"current_steps": 40, "total_steps": 1431, "loss": 0.1832, "learning_rate": 2.777777777777778e-05, "epoch": 0.08376963350785341, "percentage": 2.8, "elapsed_time": "0:05:46", "remaining_time": "3:20:44"}
{"current_steps": 50, "total_steps": 1431, "loss": 0.151, "learning_rate": 3.472222222222222e-05, "epoch": 0.10471204188481675, "percentage": 3.49, "elapsed_time": "0:07:09", "remaining_time": "3:17:38"}
{"current_steps": 60, "total_steps": 1431, "loss": 0.129, "learning_rate": 4.166666666666667e-05, "epoch": 0.1256544502617801, "percentage": 4.19, "elapsed_time": "0:08:33", "remaining_time": "3:15:23"}
{"current_steps": 70, "total_steps": 1431, "loss": 0.1248, "learning_rate": 4.8611111111111115e-05, "epoch": 0.14659685863874344, "percentage": 4.89, "elapsed_time": "0:10:00", "remaining_time": "3:14:26"}
{"current_steps": 80, "total_steps": 1431, "loss": 0.1142, "learning_rate": 5.555555555555556e-05, "epoch": 0.16753926701570682, "percentage": 5.59, "elapsed_time": "0:11:25", "remaining_time": "3:12:56"}
{"current_steps": 90, "total_steps": 1431, "loss": 0.1103, "learning_rate": 6.25e-05, "epoch": 0.18848167539267016, "percentage": 6.29, "elapsed_time": "0:12:48", "remaining_time": "3:10:48"}
{"current_steps": 100, "total_steps": 1431, "loss": 0.0985, "learning_rate": 6.944444444444444e-05, "epoch": 0.2094240837696335, "percentage": 6.99, "elapsed_time": "0:14:12", "remaining_time": "3:09:05"}
{"current_steps": 110, "total_steps": 1431, "loss": 0.0929, "learning_rate": 7.638888888888889e-05, "epoch": 0.23036649214659685, "percentage": 7.69, "elapsed_time": "0:15:37", "remaining_time": "3:07:34"}
{"current_steps": 120, "total_steps": 1431, "loss": 0.0955, "learning_rate": 8.333333333333334e-05, "epoch": 0.2513089005235602, "percentage": 8.39, "elapsed_time": "0:17:03", "remaining_time": "3:06:22"}
{"current_steps": 130, "total_steps": 1431, "loss": 0.0941, "learning_rate": 9.027777777777779e-05, "epoch": 0.27225130890052357, "percentage": 9.08, "elapsed_time": "0:18:30", "remaining_time": "3:05:13"}
{"current_steps": 140, "total_steps": 1431, "loss": 0.0906, "learning_rate": 9.722222222222223e-05, "epoch": 0.2931937172774869, "percentage": 9.78, "elapsed_time": "0:19:51", "remaining_time": "3:03:10"}
{"current_steps": 150, "total_steps": 1431, "loss": 0.0815, "learning_rate": 9.999463737538053e-05, "epoch": 0.31413612565445026, "percentage": 10.48, "elapsed_time": "0:21:15", "remaining_time": "3:01:29"}
{"current_steps": 160, "total_steps": 1431, "loss": 0.0803, "learning_rate": 9.996186994612176e-05, "epoch": 0.33507853403141363, "percentage": 11.18, "elapsed_time": "0:22:41", "remaining_time": "3:00:14"}
{"current_steps": 170, "total_steps": 1431, "loss": 0.0797, "learning_rate": 9.989933382359422e-05, "epoch": 0.35602094240837695, "percentage": 11.88, "elapsed_time": "0:24:06", "remaining_time": "2:58:47"}
{"current_steps": 180, "total_steps": 1431, "loss": 0.0768, "learning_rate": 9.980706626858607e-05, "epoch": 0.3769633507853403, "percentage": 12.58, "elapsed_time": "0:25:29", "remaining_time": "2:57:09"}
{"current_steps": 190, "total_steps": 1431, "loss": 0.0818, "learning_rate": 9.96851222567126e-05, "epoch": 0.39790575916230364, "percentage": 13.28, "elapsed_time": "0:26:54", "remaining_time": "2:55:44"}
{"current_steps": 200, "total_steps": 1431, "loss": 0.0717, "learning_rate": 9.953357444566039e-05, "epoch": 0.418848167539267, "percentage": 13.98, "elapsed_time": "0:28:19", "remaining_time": "2:54:20"}
{"current_steps": 210, "total_steps": 1431, "loss": 0.0698, "learning_rate": 9.935251313189564e-05, "epoch": 0.4397905759162304, "percentage": 14.68, "elapsed_time": "0:29:46", "remaining_time": "2:53:08"}
{"current_steps": 220, "total_steps": 1431, "loss": 0.0745, "learning_rate": 9.914204619686314e-05, "epoch": 0.4607329842931937, "percentage": 15.37, "elapsed_time": "0:31:11", "remaining_time": "2:51:41"}
{"current_steps": 230, "total_steps": 1431, "loss": 0.0719, "learning_rate": 9.890229904270731e-05, "epoch": 0.4816753926701571, "percentage": 16.07, "elapsed_time": "0:32:35", "remaining_time": "2:50:11"}
{"current_steps": 240, "total_steps": 1431, "loss": 0.0751, "learning_rate": 9.86334145175542e-05, "epoch": 0.5026178010471204, "percentage": 16.77, "elapsed_time": "0:33:57", "remaining_time": "2:48:31"}
{"current_steps": 250, "total_steps": 1431, "loss": 0.0696, "learning_rate": 9.833555283039842e-05, "epoch": 0.5235602094240838, "percentage": 17.47, "elapsed_time": "0:35:21", "remaining_time": "2:47:03"}
{"current_steps": 260, "total_steps": 1431, "loss": 0.0594, "learning_rate": 9.800889145564617e-05, "epoch": 0.5445026178010471, "percentage": 18.17, "elapsed_time": "0:36:44", "remaining_time": "2:45:26"}
{"current_steps": 270, "total_steps": 1431, "loss": 0.0732, "learning_rate": 9.765362502737097e-05, "epoch": 0.5654450261780105, "percentage": 18.87, "elapsed_time": "0:38:09", "remaining_time": "2:44:03"}
{"current_steps": 280, "total_steps": 1431, "loss": 0.0649, "learning_rate": 9.730960252267743e-05, "epoch": 0.5863874345549738, "percentage": 19.57, "elapsed_time": "0:39:34", "remaining_time": "2:42:39"}
{"current_steps": 290, "total_steps": 1431, "loss": 0.0679, "learning_rate": 9.690058365011607e-05, "epoch": 0.6073298429319371, "percentage": 20.27, "elapsed_time": "0:40:57", "remaining_time": "2:41:07"}
{"current_steps": 300, "total_steps": 1431, "loss": 0.0787, "learning_rate": 9.646362008512602e-05, "epoch": 0.6282722513089005, "percentage": 20.96, "elapsed_time": "0:42:22", "remaining_time": "2:39:46"}
{"current_steps": 310, "total_steps": 1431, "loss": 0.072, "learning_rate": 9.599897218294122e-05, "epoch": 0.6492146596858639, "percentage": 21.66, "elapsed_time": "0:43:50", "remaining_time": "2:38:31"}
{"current_steps": 320, "total_steps": 1431, "loss": 0.065, "learning_rate": 9.550691679390558e-05, "epoch": 0.6701570680628273, "percentage": 22.36, "elapsed_time": "0:45:12", "remaining_time": "2:36:58"}
{"current_steps": 330, "total_steps": 1431, "loss": 0.0644, "learning_rate": 9.498774709851779e-05, "epoch": 0.6910994764397905, "percentage": 23.06, "elapsed_time": "0:46:39", "remaining_time": "2:35:40"}
{"current_steps": 340, "total_steps": 1431, "loss": 0.0624, "learning_rate": 9.444177243274618e-05, "epoch": 0.7120418848167539, "percentage": 23.76, "elapsed_time": "0:48:02", "remaining_time": "2:34:10"}
{"current_steps": 350, "total_steps": 1431, "loss": 0.066, "learning_rate": 9.386931810371742e-05, "epoch": 0.7329842931937173, "percentage": 24.46, "elapsed_time": "0:49:28", "remaining_time": "2:32:49"}
{"current_steps": 360, "total_steps": 1431, "loss": 0.0642, "learning_rate": 9.327072519588954e-05, "epoch": 0.7539267015706806, "percentage": 25.16, "elapsed_time": "0:50:51", "remaining_time": "2:31:17"}
{"current_steps": 370, "total_steps": 1431, "loss": 0.064, "learning_rate": 9.264635036782405e-05, "epoch": 0.774869109947644, "percentage": 25.86, "elapsed_time": "0:52:16", "remaining_time": "2:29:55"}
{"current_steps": 380, "total_steps": 1431, "loss": 0.0635, "learning_rate": 9.199656563967875e-05, "epoch": 0.7958115183246073, "percentage": 26.55, "elapsed_time": "0:53:43", "remaining_time": "2:28:34"}
{"current_steps": 390, "total_steps": 1431, "loss": 0.0617, "learning_rate": 9.132175817154763e-05, "epoch": 0.8167539267015707, "percentage": 27.25, "elapsed_time": "0:55:06", "remaining_time": "2:27:04"}
{"current_steps": 400, "total_steps": 1431, "loss": 0.0612, "learning_rate": 9.062233003277983e-05, "epoch": 0.837696335078534, "percentage": 27.95, "elapsed_time": "0:56:31", "remaining_time": "2:25:40"}
{"current_steps": 410, "total_steps": 1431, "loss": 0.0609, "learning_rate": 8.989869796241559e-05, "epoch": 0.8586387434554974, "percentage": 28.65, "elapsed_time": "0:57:55", "remaining_time": "2:24:14"}
{"current_steps": 420, "total_steps": 1431, "loss": 0.0634, "learning_rate": 8.915129312088112e-05, "epoch": 0.8795811518324608, "percentage": 29.35, "elapsed_time": "0:59:18", "remaining_time": "2:22:46"}
{"current_steps": 430, "total_steps": 1431, "loss": 0.0569, "learning_rate": 8.838056083309118e-05, "epoch": 0.900523560209424, "percentage": 30.05, "elapsed_time": "1:00:41", "remaining_time": "2:21:16"}
{"current_steps": 440, "total_steps": 1431, "loss": 0.0583, "learning_rate": 8.758696032311192e-05, "epoch": 0.9214659685863874, "percentage": 30.75, "elapsed_time": "1:02:06", "remaining_time": "2:19:53"}
{"current_steps": 450, "total_steps": 1431, "loss": 0.0637, "learning_rate": 8.677096444054213e-05, "epoch": 0.9424083769633508, "percentage": 31.45, "elapsed_time": "1:03:32", "remaining_time": "2:18:31"}
{"current_steps": 460, "total_steps": 1431, "loss": 0.0607, "learning_rate": 8.593305937877614e-05, "epoch": 0.9633507853403142, "percentage": 32.15, "elapsed_time": "1:04:58", "remaining_time": "2:17:09"}
{"current_steps": 470, "total_steps": 1431, "loss": 0.0617, "learning_rate": 8.507374438531607e-05, "epoch": 0.9842931937172775, "percentage": 32.84, "elapsed_time": "1:06:21", "remaining_time": "2:15:41"}
{"current_steps": 480, "total_steps": 1431, "loss": 0.0563, "learning_rate": 8.419353146430609e-05, "epoch": 1.0052356020942408, "percentage": 33.54, "elapsed_time": "1:07:48", "remaining_time": "2:14:19"}
{"current_steps": 490, "total_steps": 1431, "loss": 0.0415, "learning_rate": 8.329294507146579e-05, "epoch": 1.0261780104712042, "percentage": 34.24, "elapsed_time": "1:09:14", "remaining_time": "2:12:57"}
{"current_steps": 500, "total_steps": 1431, "loss": 0.0402, "learning_rate": 8.23725218016048e-05, "epoch": 1.0471204188481675, "percentage": 34.94, "elapsed_time": "1:10:38", "remaining_time": "2:11:31"}
{"current_steps": 500, "total_steps": 1431, "eval_loss": 0.058112796396017075, "epoch": 1.0471204188481675, "percentage": 34.94, "elapsed_time": "1:12:16", "remaining_time": "2:14:33"}
{"current_steps": 510, "total_steps": 1431, "loss": 0.0388, "learning_rate": 8.143281006890433e-05, "epoch": 1.068062827225131, "percentage": 35.64, "elapsed_time": "1:13:39", "remaining_time": "2:13:01"}
{"current_steps": 520, "total_steps": 1431, "loss": 0.0467, "learning_rate": 8.047436978015649e-05, "epoch": 1.0890052356020943, "percentage": 36.34, "elapsed_time": "1:15:03", "remaining_time": "2:11:29"}
{"current_steps": 530, "total_steps": 1431, "loss": 0.0414, "learning_rate": 7.949777200115616e-05, "epoch": 1.1099476439790577, "percentage": 37.04, "elapsed_time": "1:16:27", "remaining_time": "2:09:58"}
{"current_steps": 540, "total_steps": 1431, "loss": 0.0413, "learning_rate": 7.850359861644368e-05, "epoch": 1.130890052356021, "percentage": 37.74, "elapsed_time": "1:17:51", "remaining_time": "2:08:28"}
{"current_steps": 550, "total_steps": 1431, "loss": 0.0448, "learning_rate": 7.749244198260175e-05, "epoch": 1.1518324607329844, "percentage": 38.43, "elapsed_time": "1:19:16", "remaining_time": "2:06:58"}
{"current_steps": 560, "total_steps": 1431, "loss": 0.0379, "learning_rate": 7.646490457531257e-05, "epoch": 1.1727748691099475, "percentage": 39.13, "elapsed_time": "1:20:37", "remaining_time": "2:05:23"}
{"current_steps": 570, "total_steps": 1431, "loss": 0.0375, "learning_rate": 7.54215986303858e-05, "epoch": 1.193717277486911, "percentage": 39.83, "elapsed_time": "1:21:59", "remaining_time": "2:03:50"}
{"current_steps": 580, "total_steps": 1431, "loss": 0.0373, "learning_rate": 7.436314577897126e-05, "epoch": 1.2146596858638743, "percentage": 40.53, "elapsed_time": "1:23:21", "remaining_time": "2:02:19"}
{"current_steps": 590, "total_steps": 1431, "loss": 0.042, "learning_rate": 7.329017667717339e-05, "epoch": 1.2356020942408377, "percentage": 41.23, "elapsed_time": "1:24:48", "remaining_time": "2:00:53"}
{"current_steps": 600, "total_steps": 1431, "loss": 0.0379, "learning_rate": 7.220333063028872e-05, "epoch": 1.256544502617801, "percentage": 41.93, "elapsed_time": "1:26:14", "remaining_time": "1:59:26"}
{"current_steps": 610, "total_steps": 1431, "loss": 0.0444, "learning_rate": 7.110325521188949e-05, "epoch": 1.2774869109947644, "percentage": 42.63, "elapsed_time": "1:27:37", "remaining_time": "1:57:56"}
{"current_steps": 620, "total_steps": 1431, "loss": 0.0422, "learning_rate": 6.999060587798128e-05, "epoch": 1.2984293193717278, "percentage": 43.33, "elapsed_time": "1:29:00", "remaining_time": "1:56:26"}
{"current_steps": 630, "total_steps": 1431, "loss": 0.0384, "learning_rate": 6.886604557646356e-05, "epoch": 1.3193717277486912, "percentage": 44.03, "elapsed_time": "1:30:25", "remaining_time": "1:54:57"}
{"current_steps": 640, "total_steps": 1431, "loss": 0.0352, "learning_rate": 6.773024435212678e-05, "epoch": 1.3403141361256545, "percentage": 44.72, "elapsed_time": "1:31:49", "remaining_time": "1:53:29"}
{"current_steps": 650, "total_steps": 1431, "loss": 0.0397, "learning_rate": 6.658387894742071e-05, "epoch": 1.3612565445026177, "percentage": 45.42, "elapsed_time": "1:33:15", "remaining_time": "1:52:03"}
{"current_steps": 660, "total_steps": 1431, "loss": 0.0375, "learning_rate": 6.542763239923215e-05, "epoch": 1.3821989528795813, "percentage": 46.12, "elapsed_time": "1:34:40", "remaining_time": "1:50:35"}
{"current_steps": 670, "total_steps": 1431, "loss": 0.0443, "learning_rate": 6.426219363191224e-05, "epoch": 1.4031413612565444, "percentage": 46.82, "elapsed_time": "1:36:02", "remaining_time": "1:49:05"}
{"current_steps": 680, "total_steps": 1431, "loss": 0.0334, "learning_rate": 6.308825704679596e-05, "epoch": 1.4240837696335078, "percentage": 47.52, "elapsed_time": "1:37:27", "remaining_time": "1:47:37"}
{"current_steps": 690, "total_steps": 1431, "loss": 0.0401, "learning_rate": 6.190652210845815e-05, "epoch": 1.4450261780104712, "percentage": 48.22, "elapsed_time": "1:38:53", "remaining_time": "1:46:11"}
{"current_steps": 700, "total_steps": 1431, "loss": 0.0367, "learning_rate": 6.0717692927952744e-05, "epoch": 1.4659685863874345, "percentage": 48.92, "elapsed_time": "1:40:18", "remaining_time": "1:44:45"}
{"current_steps": 710, "total_steps": 1431, "loss": 0.0375, "learning_rate": 5.952247784328351e-05, "epoch": 1.486910994764398, "percentage": 49.62, "elapsed_time": "1:41:44", "remaining_time": "1:43:18"}
{"current_steps": 720, "total_steps": 1431, "loss": 0.0339, "learning_rate": 5.8321588997356326e-05, "epoch": 1.5078534031413613, "percentage": 50.31, "elapsed_time": "1:43:10", "remaining_time": "1:41:53"}
{"current_steps": 730, "total_steps": 1431, "loss": 0.0381, "learning_rate": 5.7115741913664264e-05, "epoch": 1.5287958115183247, "percentage": 51.01, "elapsed_time": "1:44:33", "remaining_time": "1:40:24"}
{"current_steps": 740, "total_steps": 1431, "loss": 0.0355, "learning_rate": 5.59056550699585e-05, "epoch": 1.5497382198952878, "percentage": 51.71, "elapsed_time": "1:45:59", "remaining_time": "1:38:58"}
{"current_steps": 750, "total_steps": 1431, "loss": 0.0374, "learning_rate": 5.469204947015897e-05, "epoch": 1.5706806282722514, "percentage": 52.41, "elapsed_time": "1:47:23", "remaining_time": "1:37:30"}
{"current_steps": 760, "total_steps": 1431, "loss": 0.0327, "learning_rate": 5.3475648214759896e-05, "epoch": 1.5916230366492146, "percentage": 53.11, "elapsed_time": "1:48:48", "remaining_time": "1:36:03"}
{"current_steps": 770, "total_steps": 1431, "loss": 0.0403, "learning_rate": 5.2257176069986036e-05, "epoch": 1.6125654450261782, "percentage": 53.81, "elapsed_time": "1:50:14", "remaining_time": "1:34:38"}
{"current_steps": 780, "total_steps": 1431, "loss": 0.0364, "learning_rate": 5.103735903595658e-05, "epoch": 1.6335078534031413, "percentage": 54.51, "elapsed_time": "1:51:41", "remaining_time": "1:33:13"}
{"current_steps": 790, "total_steps": 1431, "loss": 0.0371, "learning_rate": 4.981692391411366e-05, "epoch": 1.6544502617801047, "percentage": 55.21, "elapsed_time": "1:53:04", "remaining_time": "1:31:44"}
{"current_steps": 800, "total_steps": 1431, "loss": 0.0406, "learning_rate": 4.859659787417362e-05, "epoch": 1.675392670157068, "percentage": 55.9, "elapsed_time": "1:54:29", "remaining_time": "1:30:18"}
{"current_steps": 810, "total_steps": 1431, "loss": 0.0353, "learning_rate": 4.737710802085875e-05, "epoch": 1.6963350785340314, "percentage": 56.6, "elapsed_time": "1:55:55", "remaining_time": "1:28:52"}
{"current_steps": 820, "total_steps": 1431, "loss": 0.0325, "learning_rate": 4.615918096066766e-05, "epoch": 1.7172774869109948, "percentage": 57.3, "elapsed_time": "1:57:20", "remaining_time": "1:27:26"}
{"current_steps": 830, "total_steps": 1431, "loss": 0.0318, "learning_rate": 4.4943542368942746e-05, "epoch": 1.738219895287958, "percentage": 58.0, "elapsed_time": "1:58:48", "remaining_time": "1:26:01"}
{"current_steps": 840, "total_steps": 1431, "loss": 0.0374, "learning_rate": 4.373091655749225e-05, "epoch": 1.7591623036649215, "percentage": 58.7, "elapsed_time": "2:00:12", "remaining_time": "1:24:34"}
{"current_steps": 850, "total_steps": 1431, "loss": 0.0362, "learning_rate": 4.252202604302476e-05, "epoch": 1.7801047120418847, "percentage": 59.4, "elapsed_time": "2:01:35", "remaining_time": "1:23:06"}
{"current_steps": 860, "total_steps": 1431, "loss": 0.038, "learning_rate": 4.131759111665349e-05, "epoch": 1.8010471204188483, "percentage": 60.1, "elapsed_time": "2:03:00", "remaining_time": "1:21:40"}
{"current_steps": 870, "total_steps": 1431, "loss": 0.0393, "learning_rate": 4.011832941472641e-05, "epoch": 1.8219895287958114, "percentage": 60.8, "elapsed_time": "2:04:24", "remaining_time": "1:20:13"}
{"current_steps": 880, "total_steps": 1431, "loss": 0.0336, "learning_rate": 3.8924955491238216e-05, "epoch": 1.8429319371727748, "percentage": 61.5, "elapsed_time": "2:05:48", "remaining_time": "1:18:46"}
{"current_steps": 890, "total_steps": 1431, "loss": 0.033, "learning_rate": 3.7738180392078937e-05, "epoch": 1.8638743455497382, "percentage": 62.19, "elapsed_time": "2:07:13", "remaining_time": "1:17:19"}
{"current_steps": 900, "total_steps": 1431, "loss": 0.035, "learning_rate": 3.6558711231372704e-05, "epoch": 1.8848167539267016, "percentage": 62.89, "elapsed_time": "2:08:38", "remaining_time": "1:15:54"}
{"current_steps": 910, "total_steps": 1431, "loss": 0.0357, "learning_rate": 3.538725077015915e-05, "epoch": 1.905759162303665, "percentage": 63.59, "elapsed_time": "2:10:05", "remaining_time": "1:14:28"}
{"current_steps": 920, "total_steps": 1431, "loss": 0.0313, "learning_rate": 3.422449699766851e-05, "epoch": 1.9267015706806283, "percentage": 64.29, "elapsed_time": "2:11:30", "remaining_time": "1:13:02"}
{"current_steps": 930, "total_steps": 1431, "loss": 0.0345, "learning_rate": 3.307114271543999e-05, "epoch": 1.9476439790575917, "percentage": 64.99, "elapsed_time": "2:12:55", "remaining_time": "1:11:36"}
{"current_steps": 940, "total_steps": 1431, "loss": 0.0333, "learning_rate": 3.192787512453105e-05, "epoch": 1.9685863874345548, "percentage": 65.69, "elapsed_time": "2:14:23", "remaining_time": "1:10:11"}
{"current_steps": 950, "total_steps": 1431, "loss": 0.0317, "learning_rate": 3.079537541606349e-05, "epoch": 1.9895287958115184, "percentage": 66.39, "elapsed_time": "2:15:46", "remaining_time": "1:08:44"}
{"current_steps": 960, "total_steps": 1431, "loss": 0.0235, "learning_rate": 2.9674318365350685e-05, "epoch": 2.0104712041884816, "percentage": 67.09, "elapsed_time": "2:17:12", "remaining_time": "1:07:19"}
{"current_steps": 970, "total_steps": 1431, "loss": 0.0158, "learning_rate": 2.8565371929847284e-05, "epoch": 2.031413612565445, "percentage": 67.78, "elapsed_time": "2:18:37", "remaining_time": "1:05:53"}
{"current_steps": 980, "total_steps": 1431, "loss": 0.0179, "learning_rate": 2.7469196851161373e-05, "epoch": 2.0523560209424083, "percentage": 68.48, "elapsed_time": "2:20:00", "remaining_time": "1:04:26"}
{"current_steps": 990, "total_steps": 1431, "loss": 0.0174, "learning_rate": 2.638644626136587e-05, "epoch": 2.073298429319372, "percentage": 69.18, "elapsed_time": "2:21:27", "remaining_time": "1:03:00"}
{"current_steps": 1000, "total_steps": 1431, "loss": 0.0204, "learning_rate": 2.531776529384407e-05, "epoch": 2.094240837696335, "percentage": 69.88, "elapsed_time": "2:22:52", "remaining_time": "1:01:34"}
{"current_steps": 1000, "total_steps": 1431, "eval_loss": 0.05247209593653679, "epoch": 2.094240837696335, "percentage": 69.88, "elapsed_time": "2:24:30", "remaining_time": "1:02:16"}
{"current_steps": 1010, "total_steps": 1431, "loss": 0.0178, "learning_rate": 2.426379069890098e-05, "epoch": 2.115183246073298, "percentage": 70.58, "elapsed_time": "2:25:57", "remaining_time": "1:00:50"}
{"current_steps": 1020, "total_steps": 1431, "loss": 0.0145, "learning_rate": 2.3225150464369312e-05, "epoch": 2.136125654450262, "percentage": 71.28, "elapsed_time": "2:27:22", "remaining_time": "0:59:22"}
{"current_steps": 1030, "total_steps": 1431, "loss": 0.0186, "learning_rate": 2.2202463441436884e-05, "epoch": 2.157068062827225, "percentage": 71.98, "elapsed_time": "2:28:48", "remaining_time": "0:57:56"}
{"current_steps": 1040, "total_steps": 1431, "loss": 0.0185, "learning_rate": 2.1196338975917358e-05, "epoch": 2.1780104712041886, "percentage": 72.68, "elapsed_time": "2:30:10", "remaining_time": "0:56:27"}
{"current_steps": 1050, "total_steps": 1431, "loss": 0.0148, "learning_rate": 2.0207376545184893e-05, "epoch": 2.1989528795811517, "percentage": 73.38, "elapsed_time": "2:31:31", "remaining_time": "0:54:59"}
{"current_steps": 1060, "total_steps": 1431, "loss": 0.0188, "learning_rate": 1.9236165400988638e-05, "epoch": 2.2198952879581153, "percentage": 74.07, "elapsed_time": "2:32:56", "remaining_time": "0:53:31"}
{"current_steps": 1070, "total_steps": 1431, "loss": 0.0167, "learning_rate": 1.8283284218359782e-05, "epoch": 2.2408376963350785, "percentage": 74.77, "elapsed_time": "2:34:20", "remaining_time": "0:52:04"}
{"current_steps": 1080, "total_steps": 1431, "loss": 0.0156, "learning_rate": 1.734930075082076e-05, "epoch": 2.261780104712042, "percentage": 75.47, "elapsed_time": "2:35:47", "remaining_time": "0:50:37"}
{"current_steps": 1090, "total_steps": 1431, "loss": 0.0168, "learning_rate": 1.6434771492101485e-05, "epoch": 2.282722513089005, "percentage": 76.17, "elapsed_time": "2:37:10", "remaining_time": "0:49:10"}
{"current_steps": 1100, "total_steps": 1431, "loss": 0.0178, "learning_rate": 1.5540241344564915e-05, "epoch": 2.303664921465969, "percentage": 76.87, "elapsed_time": "2:38:36", "remaining_time": "0:47:43"}
{"current_steps": 1110, "total_steps": 1431, "loss": 0.0159, "learning_rate": 1.46662432945386e-05, "epoch": 2.324607329842932, "percentage": 77.57, "elapsed_time": "2:40:01", "remaining_time": "0:46:16"}
{"current_steps": 1120, "total_steps": 1431, "loss": 0.0155, "learning_rate": 1.3813298094746491e-05, "epoch": 2.345549738219895, "percentage": 78.27, "elapsed_time": "2:41:24", "remaining_time": "0:44:49"}
{"current_steps": 1130, "total_steps": 1431, "loss": 0.0158, "learning_rate": 1.2981913954029784e-05, "epoch": 2.3664921465968587, "percentage": 78.97, "elapsed_time": "2:42:49", "remaining_time": "0:43:22"}
{"current_steps": 1140, "total_steps": 1431, "loss": 0.0162, "learning_rate": 1.2172586234541644e-05, "epoch": 2.387434554973822, "percentage": 79.66, "elapsed_time": "2:44:13", "remaining_time": "0:41:55"}
{"current_steps": 1150, "total_steps": 1431, "loss": 0.0157, "learning_rate": 1.1385797156596506e-05, "epoch": 2.4083769633507854, "percentage": 80.36, "elapsed_time": "2:45:35", "remaining_time": "0:40:27"}
{"current_steps": 1160, "total_steps": 1431, "loss": 0.0146, "learning_rate": 1.062201551134957e-05, "epoch": 2.4293193717277486, "percentage": 81.06, "elapsed_time": "2:46:59", "remaining_time": "0:39:00"}
{"current_steps": 1170, "total_steps": 1431, "loss": 0.0143, "learning_rate": 9.88169638147784e-06, "epoch": 2.450261780104712, "percentage": 81.76, "elapsed_time": "2:48:21", "remaining_time": "0:37:33"}
{"current_steps": 1180, "total_steps": 1431, "loss": 0.017, "learning_rate": 9.16528087002892e-06, "epoch": 2.4712041884816753, "percentage": 82.46, "elapsed_time": "2:49:46", "remaining_time": "0:36:06"}
{"current_steps": 1190, "total_steps": 1431, "loss": 0.0155, "learning_rate": 8.473195837599418e-06, "epoch": 2.492146596858639, "percentage": 83.16, "elapsed_time": "2:51:11", "remaining_time": "0:34:40"}
{"current_steps": 1200, "total_steps": 1431, "loss": 0.0176, "learning_rate": 7.805853647999362e-06, "epoch": 2.513089005235602, "percentage": 83.86, "elapsed_time": "2:52:35", "remaining_time": "0:33:13"}
{"current_steps": 1210, "total_steps": 1431, "loss": 0.0194, "learning_rate": 7.163651922554149e-06, "epoch": 2.5340314136125652, "percentage": 84.56, "elapsed_time": "2:53:58", "remaining_time": "0:31:46"}
{"current_steps": 1220, "total_steps": 1431, "loss": 0.0147, "learning_rate": 6.5469733031905515e-06, "epoch": 2.554973821989529, "percentage": 85.26, "elapsed_time": "2:55:22", "remaining_time": "0:30:19"}
{"current_steps": 1230, "total_steps": 1431, "loss": 0.0146, "learning_rate": 5.956185224447841e-06, "epoch": 2.5759162303664924, "percentage": 85.95, "elapsed_time": "2:56:48", "remaining_time": "0:28:53"}
{"current_steps": 1240, "total_steps": 1431, "loss": 0.0164, "learning_rate": 5.391639694549943e-06, "epoch": 2.5968586387434556, "percentage": 86.65, "elapsed_time": "2:58:12", "remaining_time": "0:27:27"}
{"current_steps": 1250, "total_steps": 1431, "loss": 0.0148, "learning_rate": 4.853673085668947e-06, "epoch": 2.6178010471204187, "percentage": 87.35, "elapsed_time": "2:59:37", "remaining_time": "0:26:00"}
{"current_steps": 1260, "total_steps": 1431, "loss": 0.0154, "learning_rate": 4.342605933505084e-06, "epoch": 2.6387434554973823, "percentage": 88.05, "elapsed_time": "3:01:01", "remaining_time": "0:24:34"}
{"current_steps": 1270, "total_steps": 1431, "loss": 0.0153, "learning_rate": 3.858742746302535e-06, "epoch": 2.6596858638743455, "percentage": 88.75, "elapsed_time": "3:02:27", "remaining_time": "0:23:07"}
{"current_steps": 1280, "total_steps": 1431, "loss": 0.0136, "learning_rate": 3.402371823414774e-06, "epoch": 2.680628272251309, "percentage": 89.45, "elapsed_time": "3:03:50", "remaining_time": "0:21:41"}
{"current_steps": 1290, "total_steps": 1431, "loss": 0.0137, "learning_rate": 2.9737650835276853e-06, "epoch": 2.701570680628272, "percentage": 90.15, "elapsed_time": "3:05:15", "remaining_time": "0:20:14"}
{"current_steps": 1300, "total_steps": 1431, "loss": 0.0204, "learning_rate": 2.573177902642726e-06, "epoch": 2.7225130890052354, "percentage": 90.85, "elapsed_time": "3:06:41", "remaining_time": "0:18:48"}
{"current_steps": 1310, "total_steps": 1431, "loss": 0.0147, "learning_rate": 2.200848961916718e-06, "epoch": 2.743455497382199, "percentage": 91.54, "elapsed_time": "3:08:07", "remaining_time": "0:17:22"}
{"current_steps": 1320, "total_steps": 1431, "loss": 0.0175, "learning_rate": 1.8570001054488362e-06, "epoch": 2.7643979057591626, "percentage": 92.24, "elapsed_time": "3:09:32", "remaining_time": "0:15:56"}
{"current_steps": 1330, "total_steps": 1431, "loss": 0.0153, "learning_rate": 1.5418362080996507e-06, "epoch": 2.7853403141361257, "percentage": 92.94, "elapsed_time": "3:10:58", "remaining_time": "0:14:30"}
{"current_steps": 1340, "total_steps": 1431, "loss": 0.0138, "learning_rate": 1.2555450534208978e-06, "epoch": 2.806282722513089, "percentage": 93.64, "elapsed_time": "3:12:21", "remaining_time": "0:13:03"}
{"current_steps": 1350, "total_steps": 1431, "loss": 0.0142, "learning_rate": 9.98297221768718e-07, "epoch": 2.8272251308900525, "percentage": 94.34, "elapsed_time": "3:13:44", "remaining_time": "0:11:37"}
{"current_steps": 1360, "total_steps": 1431, "loss": 0.0141, "learning_rate": 7.702459886670788e-07, "epoch": 2.8481675392670156, "percentage": 95.04, "elapsed_time": "3:15:09", "remaining_time": "0:10:11"}
{"current_steps": 1370, "total_steps": 1431, "loss": 0.0162, "learning_rate": 5.715272334818944e-07, "epoch": 2.869109947643979, "percentage": 95.74, "elapsed_time": "3:16:34", "remaining_time": "0:08:45"}
{"current_steps": 1380, "total_steps": 1431, "loss": 0.0159, "learning_rate": 4.02259358460233e-07, "epoch": 2.8900523560209423, "percentage": 96.44, "elapsed_time": "3:17:59", "remaining_time": "0:07:19"}
{"current_steps": 1390, "total_steps": 1431, "loss": 0.0178, "learning_rate": 2.6254321818295345e-07, "epoch": 2.9109947643979055, "percentage": 97.13, "elapsed_time": "3:19:24", "remaining_time": "0:05:52"}
{"current_steps": 1400, "total_steps": 1431, "loss": 0.0151, "learning_rate": 1.5246205947265779e-07, "epoch": 2.931937172774869, "percentage": 97.83, "elapsed_time": "3:20:48", "remaining_time": "0:04:26"}
{"current_steps": 1410, "total_steps": 1431, "loss": 0.0156, "learning_rate": 7.208147179291192e-08, "epoch": 2.9528795811518327, "percentage": 98.53, "elapsed_time": "3:22:13", "remaining_time": "0:03:00"}
{"current_steps": 1420, "total_steps": 1431, "loss": 0.0162, "learning_rate": 2.1449348168167682e-08, "epoch": 2.973821989528796, "percentage": 99.23, "elapsed_time": "3:23:38", "remaining_time": "0:01:34"}
{"current_steps": 1430, "total_steps": 1431, "loss": 0.0136, "learning_rate": 5.95856647772619e-10, "epoch": 2.994764397905759, "percentage": 99.93, "elapsed_time": "3:25:02", "remaining_time": "0:00:08"}
{"current_steps": 1431, "total_steps": 1431, "epoch": 2.9968586387434555, "percentage": 100.0, "elapsed_time": "3:25:12", "remaining_time": "0:00:00"}