time_sft_llama3_8b_2 / trainer_log.jsonl
stamina's picture
Upload folder using huggingface_hub
ffd2cd4 verified
{"current_steps": 1, "total_steps": 154, "loss": 12.6644, "lr": 0.0, "epoch": 0.006493506493506494, "percentage": 0.65, "elapsed_time": "0:00:39", "remaining_time": "1:40:37"}
{"current_steps": 2, "total_steps": 154, "loss": 13.386, "lr": 1.25e-06, "epoch": 0.012987012987012988, "percentage": 1.3, "elapsed_time": "0:01:14", "remaining_time": "1:33:45"}
{"current_steps": 3, "total_steps": 154, "loss": 12.124, "lr": 2.5e-06, "epoch": 0.01948051948051948, "percentage": 1.95, "elapsed_time": "0:01:48", "remaining_time": "1:30:38"}
{"current_steps": 4, "total_steps": 154, "loss": 9.26, "lr": 3.7500000000000005e-06, "epoch": 0.025974025974025976, "percentage": 2.6, "elapsed_time": "0:02:22", "remaining_time": "1:29:00"}
{"current_steps": 5, "total_steps": 154, "loss": 7.0851, "lr": 5e-06, "epoch": 0.032467532467532464, "percentage": 3.25, "elapsed_time": "0:02:57", "remaining_time": "1:28:04"}
{"current_steps": 6, "total_steps": 154, "loss": 4.3426, "lr": 6.25e-06, "epoch": 0.03896103896103896, "percentage": 3.9, "elapsed_time": "0:03:32", "remaining_time": "1:27:18"}
{"current_steps": 7, "total_steps": 154, "loss": 3.9004, "lr": 7.500000000000001e-06, "epoch": 0.045454545454545456, "percentage": 4.55, "elapsed_time": "0:04:07", "remaining_time": "1:26:38"}
{"current_steps": 8, "total_steps": 154, "loss": 4.2357, "lr": 8.750000000000001e-06, "epoch": 0.05194805194805195, "percentage": 5.19, "elapsed_time": "0:04:41", "remaining_time": "1:25:42"}
{"current_steps": 9, "total_steps": 154, "loss": 3.4659, "lr": 1e-05, "epoch": 0.05844155844155844, "percentage": 5.84, "elapsed_time": "0:05:15", "remaining_time": "1:24:40"}
{"current_steps": 10, "total_steps": 154, "loss": 3.2504, "lr": 1.125e-05, "epoch": 0.06493506493506493, "percentage": 6.49, "elapsed_time": "0:05:49", "remaining_time": "1:23:45"}
{"current_steps": 11, "total_steps": 154, "loss": 6.6892, "lr": 1.25e-05, "epoch": 0.07142857142857142, "percentage": 7.14, "elapsed_time": "0:06:25", "remaining_time": "1:23:26"}
{"current_steps": 12, "total_steps": 154, "loss": 3.3174, "lr": 1.375e-05, "epoch": 0.07792207792207792, "percentage": 7.79, "elapsed_time": "0:07:00", "remaining_time": "1:22:56"}
{"current_steps": 13, "total_steps": 154, "loss": 3.8063, "lr": 1.5000000000000002e-05, "epoch": 0.08441558441558442, "percentage": 8.44, "elapsed_time": "0:07:36", "remaining_time": "1:22:35"}
{"current_steps": 14, "total_steps": 154, "loss": 2.7457, "lr": 1.6250000000000002e-05, "epoch": 0.09090909090909091, "percentage": 9.09, "elapsed_time": "0:08:11", "remaining_time": "1:21:54"}
{"current_steps": 15, "total_steps": 154, "loss": 2.7346, "lr": 1.7500000000000002e-05, "epoch": 0.09740259740259741, "percentage": 9.74, "elapsed_time": "0:08:45", "remaining_time": "1:21:07"}
{"current_steps": 16, "total_steps": 154, "loss": 3.6905, "lr": 1.8750000000000002e-05, "epoch": 0.1038961038961039, "percentage": 10.39, "elapsed_time": "0:09:20", "remaining_time": "1:20:30"}
{"current_steps": 17, "total_steps": 154, "loss": 2.7146, "lr": 2e-05, "epoch": 0.11038961038961038, "percentage": 11.04, "elapsed_time": "0:09:54", "remaining_time": "1:19:47"}
{"current_steps": 18, "total_steps": 154, "loss": 2.9735, "lr": 1.9997408848413494e-05, "epoch": 0.11688311688311688, "percentage": 11.69, "elapsed_time": "0:10:27", "remaining_time": "1:19:03"}
{"current_steps": 19, "total_steps": 154, "loss": 3.0153, "lr": 1.9989636736467278e-05, "epoch": 0.12337662337662338, "percentage": 12.34, "elapsed_time": "0:11:00", "remaining_time": "1:18:12"}
{"current_steps": 20, "total_steps": 154, "loss": 2.0634, "lr": 1.9976687691905394e-05, "epoch": 0.12987012987012986, "percentage": 12.99, "elapsed_time": "0:11:34", "remaining_time": "1:17:31"}
{"current_steps": 21, "total_steps": 154, "loss": 1.7994, "lr": 1.9958568425315316e-05, "epoch": 0.13636363636363635, "percentage": 13.64, "elapsed_time": "0:12:10", "remaining_time": "1:17:03"}
{"current_steps": 22, "total_steps": 154, "loss": 1.8646, "lr": 1.9935288326650314e-05, "epoch": 0.14285714285714285, "percentage": 14.29, "elapsed_time": "0:12:43", "remaining_time": "1:16:23"}
{"current_steps": 23, "total_steps": 154, "loss": 1.6082, "lr": 1.9906859460363307e-05, "epoch": 0.14935064935064934, "percentage": 14.94, "elapsed_time": "0:13:18", "remaining_time": "1:15:47"}
{"current_steps": 24, "total_steps": 154, "loss": 1.4584, "lr": 1.98732965591547e-05, "epoch": 0.15584415584415584, "percentage": 15.58, "elapsed_time": "0:13:53", "remaining_time": "1:15:13"}
{"current_steps": 25, "total_steps": 154, "loss": 1.2276, "lr": 1.9834617016337424e-05, "epoch": 0.16233766233766234, "percentage": 16.23, "elapsed_time": "0:14:27", "remaining_time": "1:14:38"}
{"current_steps": 26, "total_steps": 154, "loss": 1.1038, "lr": 1.979084087682323e-05, "epoch": 0.16883116883116883, "percentage": 16.88, "elapsed_time": "0:15:02", "remaining_time": "1:14:03"}
{"current_steps": 27, "total_steps": 154, "loss": 0.9448, "lr": 1.9741990826734793e-05, "epoch": 0.17532467532467533, "percentage": 17.53, "elapsed_time": "0:15:36", "remaining_time": "1:13:24"}
{"current_steps": 28, "total_steps": 154, "loss": 0.8475, "lr": 1.9688092181649065e-05, "epoch": 0.18181818181818182, "percentage": 18.18, "elapsed_time": "0:16:10", "remaining_time": "1:12:49"}
{"current_steps": 29, "total_steps": 154, "loss": 0.6988, "lr": 1.9629172873477995e-05, "epoch": 0.18831168831168832, "percentage": 18.83, "elapsed_time": "0:16:45", "remaining_time": "1:12:15"}
{"current_steps": 30, "total_steps": 154, "loss": 0.591, "lr": 1.956526343599335e-05, "epoch": 0.19480519480519481, "percentage": 19.48, "elapsed_time": "0:17:20", "remaining_time": "1:11:38"}
{"current_steps": 31, "total_steps": 154, "loss": 0.504, "lr": 1.9496396989003195e-05, "epoch": 0.2012987012987013, "percentage": 20.13, "elapsed_time": "0:17:53", "remaining_time": "1:10:58"}
{"current_steps": 32, "total_steps": 154, "loss": 0.4665, "lr": 1.9422609221188208e-05, "epoch": 0.2077922077922078, "percentage": 20.78, "elapsed_time": "0:18:27", "remaining_time": "1:10:21"}
{"current_steps": 33, "total_steps": 154, "loss": 0.4967, "lr": 1.9343938371606714e-05, "epoch": 0.21428571428571427, "percentage": 21.43, "elapsed_time": "0:18:59", "remaining_time": "1:09:36"}
{"current_steps": 34, "total_steps": 154, "loss": 0.4135, "lr": 1.9260425209878052e-05, "epoch": 0.22077922077922077, "percentage": 22.08, "elapsed_time": "0:19:32", "remaining_time": "1:08:59"}
{"current_steps": 35, "total_steps": 154, "loss": 0.5827, "lr": 1.917211301505453e-05, "epoch": 0.22727272727272727, "percentage": 22.73, "elapsed_time": "0:20:06", "remaining_time": "1:08:22"}
{"current_steps": 36, "total_steps": 154, "loss": 0.6328, "lr": 1.907904755319289e-05, "epoch": 0.23376623376623376, "percentage": 23.38, "elapsed_time": "0:20:42", "remaining_time": "1:07:51"}
{"current_steps": 37, "total_steps": 154, "loss": 0.3192, "lr": 1.8981277053636963e-05, "epoch": 0.24025974025974026, "percentage": 24.03, "elapsed_time": "0:21:17", "remaining_time": "1:07:20"}
{"current_steps": 38, "total_steps": 154, "loss": 0.437, "lr": 1.8878852184023754e-05, "epoch": 0.24675324675324675, "percentage": 24.68, "elapsed_time": "0:21:51", "remaining_time": "1:06:44"}
{"current_steps": 39, "total_steps": 154, "loss": 0.7421, "lr": 1.8771826024025944e-05, "epoch": 0.2532467532467532, "percentage": 25.32, "elapsed_time": "0:22:25", "remaining_time": "1:06:08"}
{"current_steps": 40, "total_steps": 154, "loss": 0.4279, "lr": 1.866025403784439e-05, "epoch": 0.2597402597402597, "percentage": 25.97, "elapsed_time": "0:23:00", "remaining_time": "1:05:35"}
{"current_steps": 41, "total_steps": 154, "loss": 0.3088, "lr": 1.8544194045464888e-05, "epoch": 0.2662337662337662, "percentage": 26.62, "elapsed_time": "0:23:33", "remaining_time": "1:04:55"}
{"current_steps": 42, "total_steps": 154, "loss": 0.2931, "lr": 1.8423706192694118e-05, "epoch": 0.2727272727272727, "percentage": 27.27, "elapsed_time": "0:24:07", "remaining_time": "1:04:19"}
{"current_steps": 43, "total_steps": 154, "loss": 0.4912, "lr": 1.8298852919990254e-05, "epoch": 0.2792207792207792, "percentage": 27.92, "elapsed_time": "0:24:41", "remaining_time": "1:03:44"}
{"current_steps": 44, "total_steps": 154, "loss": 0.3692, "lr": 1.816969893010442e-05, "epoch": 0.2857142857142857, "percentage": 28.57, "elapsed_time": "0:25:17", "remaining_time": "1:03:12"}
{"current_steps": 45, "total_steps": 154, "loss": 0.2944, "lr": 1.8036311154549783e-05, "epoch": 0.2922077922077922, "percentage": 29.22, "elapsed_time": "0:25:51", "remaining_time": "1:02:38"}
{"current_steps": 46, "total_steps": 154, "loss": 0.5252, "lr": 1.789875871891559e-05, "epoch": 0.2987012987012987, "percentage": 29.87, "elapsed_time": "0:26:26", "remaining_time": "1:02:03"}
{"current_steps": 47, "total_steps": 154, "loss": 0.5614, "lr": 1.77571129070442e-05, "epoch": 0.3051948051948052, "percentage": 30.52, "elapsed_time": "0:27:00", "remaining_time": "1:01:29"}
{"current_steps": 48, "total_steps": 154, "loss": 0.3101, "lr": 1.761144712408965e-05, "epoch": 0.3116883116883117, "percentage": 31.17, "elapsed_time": "0:27:33", "remaining_time": "1:00:51"}
{"current_steps": 49, "total_steps": 154, "loss": 8.3024, "lr": 1.7461836858476858e-05, "epoch": 0.3181818181818182, "percentage": 31.82, "elapsed_time": "0:28:09", "remaining_time": "1:00:20"}
{"current_steps": 50, "total_steps": 154, "loss": 0.5558, "lr": 1.730835964278124e-05, "epoch": 0.3246753246753247, "percentage": 32.47, "elapsed_time": "0:28:43", "remaining_time": "0:59:44"}
{"current_steps": 51, "total_steps": 154, "loss": 0.5592, "lr": 1.7151095013548996e-05, "epoch": 0.33116883116883117, "percentage": 33.12, "elapsed_time": "0:29:18", "remaining_time": "0:59:12"}
{"current_steps": 52, "total_steps": 154, "loss": 0.3671, "lr": 1.699012447007882e-05, "epoch": 0.33766233766233766, "percentage": 33.77, "elapsed_time": "0:29:54", "remaining_time": "0:58:39"}
{"current_steps": 53, "total_steps": 154, "loss": 0.3092, "lr": 1.6825531432186545e-05, "epoch": 0.34415584415584416, "percentage": 34.42, "elapsed_time": "0:30:29", "remaining_time": "0:58:05"}
{"current_steps": 54, "total_steps": 154, "loss": 0.3291, "lr": 1.6657401196974405e-05, "epoch": 0.35064935064935066, "percentage": 35.06, "elapsed_time": "0:31:03", "remaining_time": "0:57:30"}
{"current_steps": 55, "total_steps": 154, "loss": 0.2884, "lr": 1.648582089462756e-05, "epoch": 0.35714285714285715, "percentage": 35.71, "elapsed_time": "0:31:35", "remaining_time": "0:56:52"}
{"current_steps": 56, "total_steps": 154, "loss": 0.4151, "lr": 1.631087944326053e-05, "epoch": 0.36363636363636365, "percentage": 36.36, "elapsed_time": "0:32:08", "remaining_time": "0:56:14"}
{"current_steps": 57, "total_steps": 154, "loss": 0.4914, "lr": 1.6132667502837164e-05, "epoch": 0.37012987012987014, "percentage": 37.01, "elapsed_time": "0:32:43", "remaining_time": "0:55:41"}
{"current_steps": 58, "total_steps": 154, "loss": 0.3513, "lr": 1.59512774281879e-05, "epoch": 0.37662337662337664, "percentage": 37.66, "elapsed_time": "0:33:18", "remaining_time": "0:55:07"}
{"current_steps": 59, "total_steps": 154, "loss": 0.279, "lr": 1.5766803221148676e-05, "epoch": 0.38311688311688313, "percentage": 38.31, "elapsed_time": "0:33:53", "remaining_time": "0:54:33"}
{"current_steps": 60, "total_steps": 154, "loss": 0.3062, "lr": 1.5579340481846338e-05, "epoch": 0.38961038961038963, "percentage": 38.96, "elapsed_time": "0:34:27", "remaining_time": "0:53:58"}
{"current_steps": 61, "total_steps": 154, "loss": 0.2837, "lr": 1.538898635915576e-05, "epoch": 0.3961038961038961, "percentage": 39.61, "elapsed_time": "0:34:59", "remaining_time": "0:53:20"}
{"current_steps": 62, "total_steps": 154, "loss": 0.3502, "lr": 1.5195839500354337e-05, "epoch": 0.4025974025974026, "percentage": 40.26, "elapsed_time": "0:35:34", "remaining_time": "0:52:47"}
{"current_steps": 63, "total_steps": 154, "loss": 0.3433, "lr": 1.5000000000000002e-05, "epoch": 0.4090909090909091, "percentage": 40.91, "elapsed_time": "0:36:06", "remaining_time": "0:52:09"}
{"current_steps": 64, "total_steps": 154, "loss": 0.3237, "lr": 1.4801569348059158e-05, "epoch": 0.4155844155844156, "percentage": 41.56, "elapsed_time": "0:36:41", "remaining_time": "0:51:36"}
{"current_steps": 65, "total_steps": 154, "loss": 0.2881, "lr": 1.4600650377311523e-05, "epoch": 0.42207792207792205, "percentage": 42.21, "elapsed_time": "0:37:14", "remaining_time": "0:50:59"}
{"current_steps": 66, "total_steps": 154, "loss": 0.3027, "lr": 1.4397347210059059e-05, "epoch": 0.42857142857142855, "percentage": 42.86, "elapsed_time": "0:37:48", "remaining_time": "0:50:25"}
{"current_steps": 67, "total_steps": 154, "loss": 0.3013, "lr": 1.4191765204166643e-05, "epoch": 0.43506493506493504, "percentage": 43.51, "elapsed_time": "0:38:23", "remaining_time": "0:49:50"}
{"current_steps": 68, "total_steps": 154, "loss": 0.3018, "lr": 1.3984010898462417e-05, "epoch": 0.44155844155844154, "percentage": 44.16, "elapsed_time": "0:38:56", "remaining_time": "0:49:15"}
{"current_steps": 69, "total_steps": 154, "loss": 0.3391, "lr": 1.3774191957526144e-05, "epoch": 0.44805194805194803, "percentage": 44.81, "elapsed_time": "0:39:31", "remaining_time": "0:48:41"}
{"current_steps": 70, "total_steps": 154, "loss": 0.2963, "lr": 1.356241711589417e-05, "epoch": 0.45454545454545453, "percentage": 45.45, "elapsed_time": "0:40:04", "remaining_time": "0:48:05"}
{"current_steps": 71, "total_steps": 154, "loss": 0.2732, "lr": 1.3348796121709862e-05, "epoch": 0.461038961038961, "percentage": 46.1, "elapsed_time": "0:40:39", "remaining_time": "0:47:31"}
{"current_steps": 72, "total_steps": 154, "loss": 0.3253, "lr": 1.3133439679848824e-05, "epoch": 0.4675324675324675, "percentage": 46.75, "elapsed_time": "0:41:14", "remaining_time": "0:46:58"}
{"current_steps": 73, "total_steps": 154, "loss": 0.2838, "lr": 1.291645939454825e-05, "epoch": 0.474025974025974, "percentage": 47.4, "elapsed_time": "0:41:48", "remaining_time": "0:46:23"}
{"current_steps": 74, "total_steps": 154, "loss": 0.2912, "lr": 1.2697967711570243e-05, "epoch": 0.4805194805194805, "percentage": 48.05, "elapsed_time": "0:42:22", "remaining_time": "0:45:48"}
{"current_steps": 75, "total_steps": 154, "loss": 0.3109, "lr": 1.2478077859929e-05, "epoch": 0.487012987012987, "percentage": 48.7, "elapsed_time": "0:42:56", "remaining_time": "0:45:13"}
{"current_steps": 76, "total_steps": 154, "loss": 0.2769, "lr": 1.2256903793212107e-05, "epoch": 0.4935064935064935, "percentage": 49.35, "elapsed_time": "0:43:31", "remaining_time": "0:44:40"}
{"current_steps": 77, "total_steps": 154, "loss": 0.2776, "lr": 1.2034560130526341e-05, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "0:44:06", "remaining_time": "0:44:06"}
{"current_steps": 78, "total_steps": 154, "loss": 0.259, "lr": 1.1811162097098559e-05, "epoch": 0.5064935064935064, "percentage": 50.65, "elapsed_time": "0:44:39", "remaining_time": "0:43:30"}
{"current_steps": 79, "total_steps": 154, "loss": 0.3168, "lr": 1.1586825464562515e-05, "epoch": 0.512987012987013, "percentage": 51.3, "elapsed_time": "0:45:14", "remaining_time": "0:42:57"}
{"current_steps": 80, "total_steps": 154, "loss": 0.361, "lr": 1.1361666490962468e-05, "epoch": 0.5194805194805194, "percentage": 51.95, "elapsed_time": "0:45:47", "remaining_time": "0:42:21"}
{"current_steps": 81, "total_steps": 154, "loss": 0.3048, "lr": 1.113580186050475e-05, "epoch": 0.525974025974026, "percentage": 52.6, "elapsed_time": "0:46:22", "remaining_time": "0:41:47"}
{"current_steps": 82, "total_steps": 154, "loss": 0.28, "lr": 1.0909348623088472e-05, "epoch": 0.5324675324675324, "percentage": 53.25, "elapsed_time": "0:46:54", "remaining_time": "0:41:11"}
{"current_steps": 83, "total_steps": 154, "loss": 0.2902, "lr": 1.0682424133646712e-05, "epoch": 0.538961038961039, "percentage": 53.9, "elapsed_time": "0:47:29", "remaining_time": "0:40:37"}
{"current_steps": 84, "total_steps": 154, "loss": 0.2765, "lr": 1.0455145991329639e-05, "epoch": 0.5454545454545454, "percentage": 54.55, "elapsed_time": "0:48:03", "remaining_time": "0:40:02"}
{"current_steps": 85, "total_steps": 154, "loss": 0.2785, "lr": 1.0227631978561057e-05, "epoch": 0.551948051948052, "percentage": 55.19, "elapsed_time": "0:48:38", "remaining_time": "0:39:28"}
{"current_steps": 86, "total_steps": 154, "loss": 0.2845, "lr": 1e-05, "epoch": 0.5584415584415584, "percentage": 55.84, "elapsed_time": "0:49:13", "remaining_time": "0:38:55"}
{"current_steps": 87, "total_steps": 154, "loss": 0.2827, "lr": 9.772368021438943e-06, "epoch": 0.564935064935065, "percentage": 56.49, "elapsed_time": "0:49:48", "remaining_time": "0:38:21"}
{"current_steps": 88, "total_steps": 154, "loss": 0.3217, "lr": 9.544854008670366e-06, "epoch": 0.5714285714285714, "percentage": 57.14, "elapsed_time": "0:50:22", "remaining_time": "0:37:46"}
{"current_steps": 89, "total_steps": 154, "loss": 0.292, "lr": 9.317575866353293e-06, "epoch": 0.577922077922078, "percentage": 57.79, "elapsed_time": "0:50:56", "remaining_time": "0:37:12"}
{"current_steps": 90, "total_steps": 154, "loss": 0.3001, "lr": 9.090651376911532e-06, "epoch": 0.5844155844155844, "percentage": 58.44, "elapsed_time": "0:51:27", "remaining_time": "0:36:35"}
{"current_steps": 91, "total_steps": 154, "loss": 0.2886, "lr": 8.86419813949525e-06, "epoch": 0.5909090909090909, "percentage": 59.09, "elapsed_time": "0:52:01", "remaining_time": "0:36:00"}
{"current_steps": 92, "total_steps": 154, "loss": 0.299, "lr": 8.638333509037537e-06, "epoch": 0.5974025974025974, "percentage": 59.74, "elapsed_time": "0:52:34", "remaining_time": "0:35:26"}
{"current_steps": 93, "total_steps": 154, "loss": 0.3178, "lr": 8.413174535437486e-06, "epoch": 0.6038961038961039, "percentage": 60.39, "elapsed_time": "0:53:08", "remaining_time": "0:34:51"}
{"current_steps": 94, "total_steps": 154, "loss": 0.3026, "lr": 8.188837902901441e-06, "epoch": 0.6103896103896104, "percentage": 61.04, "elapsed_time": "0:53:42", "remaining_time": "0:34:17"}
{"current_steps": 95, "total_steps": 154, "loss": 0.3063, "lr": 7.965439869473664e-06, "epoch": 0.6168831168831169, "percentage": 61.69, "elapsed_time": "0:54:16", "remaining_time": "0:33:42"}
{"current_steps": 96, "total_steps": 154, "loss": 0.2861, "lr": 7.743096206787894e-06, "epoch": 0.6233766233766234, "percentage": 62.34, "elapsed_time": "0:54:51", "remaining_time": "0:33:08"}
{"current_steps": 97, "total_steps": 154, "loss": 0.2873, "lr": 7.521922140071003e-06, "epoch": 0.6298701298701299, "percentage": 62.99, "elapsed_time": "0:55:26", "remaining_time": "0:32:35"}
{"current_steps": 98, "total_steps": 154, "loss": 0.2772, "lr": 7.3020322884297565e-06, "epoch": 0.6363636363636364, "percentage": 63.64, "elapsed_time": "0:55:59", "remaining_time": "0:31:59"}
{"current_steps": 99, "total_steps": 154, "loss": 0.2954, "lr": 7.0835406054517505e-06, "epoch": 0.6428571428571429, "percentage": 64.29, "elapsed_time": "0:56:33", "remaining_time": "0:31:25"}
{"current_steps": 100, "total_steps": 154, "loss": 0.2928, "lr": 6.866560320151179e-06, "epoch": 0.6493506493506493, "percentage": 64.94, "elapsed_time": "0:57:07", "remaining_time": "0:30:51"}
{"current_steps": 101, "total_steps": 154, "loss": 0.2747, "lr": 6.651203878290139e-06, "epoch": 0.6558441558441559, "percentage": 65.58, "elapsed_time": "0:57:43", "remaining_time": "0:30:17"}
{"current_steps": 102, "total_steps": 154, "loss": 0.2796, "lr": 6.437582884105835e-06, "epoch": 0.6623376623376623, "percentage": 66.23, "elapsed_time": "0:58:17", "remaining_time": "0:29:43"}
{"current_steps": 103, "total_steps": 154, "loss": 0.2645, "lr": 6.225808042473857e-06, "epoch": 0.6688311688311688, "percentage": 66.88, "elapsed_time": "0:58:52", "remaining_time": "0:29:09"}
{"current_steps": 104, "total_steps": 154, "loss": 0.2813, "lr": 6.015989101537586e-06, "epoch": 0.6753246753246753, "percentage": 67.53, "elapsed_time": "0:59:26", "remaining_time": "0:28:34"}
{"current_steps": 105, "total_steps": 154, "loss": 0.2801, "lr": 5.8082347958333625e-06, "epoch": 0.6818181818181818, "percentage": 68.18, "elapsed_time": "1:00:00", "remaining_time": "0:28:00"}
{"current_steps": 106, "total_steps": 154, "loss": 0.2814, "lr": 5.602652789940941e-06, "epoch": 0.6883116883116883, "percentage": 68.83, "elapsed_time": "1:00:35", "remaining_time": "0:27:26"}
{"current_steps": 107, "total_steps": 154, "loss": 0.2771, "lr": 5.399349622688479e-06, "epoch": 0.6948051948051948, "percentage": 69.48, "elapsed_time": "1:01:09", "remaining_time": "0:26:51"}
{"current_steps": 108, "total_steps": 154, "loss": 0.3031, "lr": 5.198430651940846e-06, "epoch": 0.7012987012987013, "percentage": 70.13, "elapsed_time": "1:01:43", "remaining_time": "0:26:17"}
{"current_steps": 109, "total_steps": 154, "loss": 0.3317, "lr": 5.000000000000003e-06, "epoch": 0.7077922077922078, "percentage": 70.78, "elapsed_time": "1:02:17", "remaining_time": "0:25:42"}
{"current_steps": 110, "total_steps": 154, "loss": 0.284, "lr": 4.804160499645667e-06, "epoch": 0.7142857142857143, "percentage": 71.43, "elapsed_time": "1:02:51", "remaining_time": "0:25:08"}
{"current_steps": 111, "total_steps": 154, "loss": 0.2656, "lr": 4.611013640844245e-06, "epoch": 0.7207792207792207, "percentage": 72.08, "elapsed_time": "1:03:25", "remaining_time": "0:24:34"}
{"current_steps": 112, "total_steps": 154, "loss": 0.2952, "lr": 4.420659518153667e-06, "epoch": 0.7272727272727273, "percentage": 72.73, "elapsed_time": "1:04:00", "remaining_time": "0:24:00"}
{"current_steps": 113, "total_steps": 154, "loss": 0.2894, "lr": 4.2331967788513295e-06, "epoch": 0.7337662337662337, "percentage": 73.38, "elapsed_time": "1:04:33", "remaining_time": "0:23:25"}
{"current_steps": 114, "total_steps": 154, "loss": 0.2943, "lr": 4.048722571812105e-06, "epoch": 0.7402597402597403, "percentage": 74.03, "elapsed_time": "1:05:06", "remaining_time": "0:22:50"}
{"current_steps": 115, "total_steps": 154, "loss": 0.2717, "lr": 3.867332497162836e-06, "epoch": 0.7467532467532467, "percentage": 74.68, "elapsed_time": "1:05:41", "remaining_time": "0:22:16"}
{"current_steps": 116, "total_steps": 154, "loss": 0.2675, "lr": 3.689120556739475e-06, "epoch": 0.7532467532467533, "percentage": 75.32, "elapsed_time": "1:06:14", "remaining_time": "0:21:41"}
{"current_steps": 117, "total_steps": 154, "loss": 0.2891, "lr": 3.5141791053724405e-06, "epoch": 0.7597402597402597, "percentage": 75.97, "elapsed_time": "1:06:47", "remaining_time": "0:21:07"}
{"current_steps": 118, "total_steps": 154, "loss": 0.2742, "lr": 3.342598803025595e-06, "epoch": 0.7662337662337663, "percentage": 76.62, "elapsed_time": "1:07:21", "remaining_time": "0:20:32"}
{"current_steps": 119, "total_steps": 154, "loss": 0.2828, "lr": 3.174468567813461e-06, "epoch": 0.7727272727272727, "percentage": 77.27, "elapsed_time": "1:07:56", "remaining_time": "0:19:58"}
{"current_steps": 120, "total_steps": 154, "loss": 0.2702, "lr": 3.009875529921181e-06, "epoch": 0.7792207792207793, "percentage": 77.92, "elapsed_time": "1:08:31", "remaining_time": "0:19:24"}
{"current_steps": 121, "total_steps": 154, "loss": 0.2843, "lr": 2.8489049864510053e-06, "epoch": 0.7857142857142857, "percentage": 78.57, "elapsed_time": "1:09:05", "remaining_time": "0:18:50"}
{"current_steps": 122, "total_steps": 154, "loss": 0.2767, "lr": 2.691640357218759e-06, "epoch": 0.7922077922077922, "percentage": 79.22, "elapsed_time": "1:09:40", "remaining_time": "0:18:16"}
{"current_steps": 123, "total_steps": 154, "loss": 0.2646, "lr": 2.5381631415231455e-06, "epoch": 0.7987012987012987, "percentage": 79.87, "elapsed_time": "1:10:14", "remaining_time": "0:17:42"}
{"current_steps": 124, "total_steps": 154, "loss": 0.2922, "lr": 2.388552875910354e-06, "epoch": 0.8051948051948052, "percentage": 80.52, "elapsed_time": "1:10:49", "remaining_time": "0:17:08"}
{"current_steps": 125, "total_steps": 154, "loss": 0.2836, "lr": 2.2428870929558012e-06, "epoch": 0.8116883116883117, "percentage": 81.17, "elapsed_time": "1:11:23", "remaining_time": "0:16:33"}
{"current_steps": 126, "total_steps": 154, "loss": 0.2809, "lr": 2.101241281084416e-06, "epoch": 0.8181818181818182, "percentage": 81.82, "elapsed_time": "1:11:59", "remaining_time": "0:15:59"}
{"current_steps": 127, "total_steps": 154, "loss": 0.2745, "lr": 1.963688845450218e-06, "epoch": 0.8246753246753247, "percentage": 82.47, "elapsed_time": "1:12:34", "remaining_time": "0:15:25"}
{"current_steps": 128, "total_steps": 154, "loss": 0.2933, "lr": 1.8303010698955803e-06, "epoch": 0.8311688311688312, "percentage": 83.12, "elapsed_time": "1:13:07", "remaining_time": "0:14:51"}
{"current_steps": 129, "total_steps": 154, "loss": 0.279, "lr": 1.7011470800097496e-06, "epoch": 0.8376623376623377, "percentage": 83.77, "elapsed_time": "1:13:41", "remaining_time": "0:14:16"}
{"current_steps": 130, "total_steps": 154, "loss": 0.2927, "lr": 1.5762938073058853e-06, "epoch": 0.8441558441558441, "percentage": 84.42, "elapsed_time": "1:14:17", "remaining_time": "0:13:42"}
{"current_steps": 131, "total_steps": 154, "loss": 0.2723, "lr": 1.4558059545351144e-06, "epoch": 0.8506493506493507, "percentage": 85.06, "elapsed_time": "1:14:50", "remaining_time": "0:13:08"}
{"current_steps": 132, "total_steps": 154, "loss": 0.2787, "lr": 1.339745962155613e-06, "epoch": 0.8571428571428571, "percentage": 85.71, "elapsed_time": "1:15:25", "remaining_time": "0:12:34"}
{"current_steps": 133, "total_steps": 154, "loss": 0.2775, "lr": 1.2281739759740575e-06, "epoch": 0.8636363636363636, "percentage": 86.36, "elapsed_time": "1:15:59", "remaining_time": "0:11:59"}
{"current_steps": 134, "total_steps": 154, "loss": 0.2818, "lr": 1.121147815976248e-06, "epoch": 0.8701298701298701, "percentage": 87.01, "elapsed_time": "1:16:33", "remaining_time": "0:11:25"}
{"current_steps": 135, "total_steps": 154, "loss": 0.2704, "lr": 1.01872294636304e-06, "epoch": 0.8766233766233766, "percentage": 87.66, "elapsed_time": "1:17:08", "remaining_time": "0:10:51"}
{"current_steps": 136, "total_steps": 154, "loss": 0.2765, "lr": 9.209524468071096e-07, "epoch": 0.8831168831168831, "percentage": 88.31, "elapsed_time": "1:17:42", "remaining_time": "0:10:17"}
{"current_steps": 137, "total_steps": 154, "loss": 0.2752, "lr": 8.278869849454718e-07, "epoch": 0.8896103896103896, "percentage": 88.96, "elapsed_time": "1:18:17", "remaining_time": "0:09:42"}
{"current_steps": 138, "total_steps": 154, "loss": 0.2721, "lr": 7.395747901219474e-07, "epoch": 0.8961038961038961, "percentage": 89.61, "elapsed_time": "1:18:52", "remaining_time": "0:09:08"}
{"current_steps": 139, "total_steps": 154, "loss": 0.2666, "lr": 6.560616283932897e-07, "epoch": 0.9025974025974026, "percentage": 90.26, "elapsed_time": "1:19:26", "remaining_time": "0:08:34"}
{"current_steps": 140, "total_steps": 154, "loss": 0.279, "lr": 5.77390778811796e-07, "epoch": 0.9090909090909091, "percentage": 90.91, "elapsed_time": "1:20:01", "remaining_time": "0:08:00"}
{"current_steps": 141, "total_steps": 154, "loss": 0.2798, "lr": 5.036030109968082e-07, "epoch": 0.9155844155844156, "percentage": 91.56, "elapsed_time": "1:20:35", "remaining_time": "0:07:25"}
{"current_steps": 142, "total_steps": 154, "loss": 0.2697, "lr": 4.3473656400665256e-07, "epoch": 0.922077922077922, "percentage": 92.21, "elapsed_time": "1:21:10", "remaining_time": "0:06:51"}
{"current_steps": 143, "total_steps": 154, "loss": 0.2745, "lr": 3.708271265220087e-07, "epoch": 0.9285714285714286, "percentage": 92.86, "elapsed_time": "1:21:45", "remaining_time": "0:06:17"}
{"current_steps": 144, "total_steps": 154, "loss": 0.2682, "lr": 3.119078183509372e-07, "epoch": 0.935064935064935, "percentage": 93.51, "elapsed_time": "1:22:21", "remaining_time": "0:05:43"}
{"current_steps": 145, "total_steps": 154, "loss": 0.2781, "lr": 2.5800917326521013e-07, "epoch": 0.9415584415584416, "percentage": 94.16, "elapsed_time": "1:22:54", "remaining_time": "0:05:08"}
{"current_steps": 146, "total_steps": 154, "loss": 0.2708, "lr": 2.091591231767709e-07, "epoch": 0.948051948051948, "percentage": 94.81, "elapsed_time": "1:23:27", "remaining_time": "0:04:34"}
{"current_steps": 147, "total_steps": 154, "loss": 0.2666, "lr": 1.6538298366257975e-07, "epoch": 0.9545454545454546, "percentage": 95.45, "elapsed_time": "1:24:00", "remaining_time": "0:04:00"}
{"current_steps": 148, "total_steps": 154, "loss": 0.2809, "lr": 1.2670344084530384e-07, "epoch": 0.961038961038961, "percentage": 96.1, "elapsed_time": "1:24:37", "remaining_time": "0:03:25"}
{"current_steps": 149, "total_steps": 154, "loss": 0.2679, "lr": 9.314053963669245e-08, "epoch": 0.9675324675324676, "percentage": 96.75, "elapsed_time": "1:25:12", "remaining_time": "0:02:51"}
{"current_steps": 150, "total_steps": 154, "loss": 0.2691, "lr": 6.471167334968887e-08, "epoch": 0.974025974025974, "percentage": 97.4, "elapsed_time": "1:25:45", "remaining_time": "0:02:17"}
{"current_steps": 151, "total_steps": 154, "loss": 0.276, "lr": 4.143157468468717e-08, "epoch": 0.9805194805194806, "percentage": 98.05, "elapsed_time": "1:26:20", "remaining_time": "0:01:42"}
{"current_steps": 152, "total_steps": 154, "loss": 0.2796, "lr": 2.3312308094607382e-08, "epoch": 0.987012987012987, "percentage": 98.7, "elapsed_time": "1:26:54", "remaining_time": "0:01:08"}
{"current_steps": 153, "total_steps": 154, "loss": 0.2645, "lr": 1.0363263532724433e-08, "epoch": 0.9935064935064936, "percentage": 99.35, "elapsed_time": "1:27:29", "remaining_time": "0:00:34"}
{"current_steps": 154, "total_steps": 154, "loss": 0.2856, "lr": 2.591151586508467e-09, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1:28:03", "remaining_time": "0:00:00"}
{"current_steps": 154, "total_steps": 154, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1:28:37", "remaining_time": "0:00:00"}