time_sft_llama3_8b / trainer_log.jsonl
stamina's picture
Upload folder using huggingface_hub
a24198f verified
{"current_steps": 10, "total_steps": 172, "loss": 7.5213, "lr": 1e-05, "epoch": 0.11527377521613832, "percentage": 5.81, "elapsed_time": "0:11:36", "remaining_time": "3:08:05"}
{"current_steps": 20, "total_steps": 172, "loss": 2.6949, "lr": 1.9997919281892066e-05, "epoch": 0.23054755043227665, "percentage": 11.63, "elapsed_time": "0:23:09", "remaining_time": "2:56:02"}
{"current_steps": 30, "total_steps": 172, "loss": 1.2043, "lr": 1.9749279121818235e-05, "epoch": 0.345821325648415, "percentage": 17.44, "elapsed_time": "0:34:44", "remaining_time": "2:44:27"}
{"current_steps": 40, "total_steps": 172, "loss": 0.4223, "lr": 1.9096319953545186e-05, "epoch": 0.4610951008645533, "percentage": 23.26, "elapsed_time": "0:46:14", "remaining_time": "2:32:35"}
{"current_steps": 50, "total_steps": 172, "loss": 0.319, "lr": 1.8066121092375303e-05, "epoch": 0.5763688760806917, "percentage": 29.07, "elapsed_time": "0:57:51", "remaining_time": "2:21:10"}
{"current_steps": 60, "total_steps": 172, "loss": 1.4997, "lr": 1.67014066183756e-05, "epoch": 0.69164265129683, "percentage": 34.88, "elapsed_time": "4:28:38", "remaining_time": "8:21:27"}
{"current_steps": 70, "total_steps": 172, "loss": 0.3865, "lr": 1.5058773536894685e-05, "epoch": 0.8069164265129684, "percentage": 40.7, "elapsed_time": "4:40:12", "remaining_time": "6:48:18"}
{"current_steps": 80, "total_steps": 172, "loss": 0.3256, "lr": 1.3206344605527355e-05, "epoch": 0.9221902017291066, "percentage": 46.51, "elapsed_time": "4:51:51", "remaining_time": "5:35:37"}
{"current_steps": 86, "total_steps": 172, "eval_loss": 0.33376210927963257, "epoch": 0.9913544668587896, "percentage": 50.0, "elapsed_time": "5:02:02", "remaining_time": "5:02:02"}
{"current_steps": 90, "total_steps": 172, "loss": 0.3396, "lr": 1.12209431687416e-05, "epoch": 1.0461095100864553, "percentage": 52.33, "elapsed_time": "5:07:10", "remaining_time": "4:39:52"}
{"current_steps": 100, "total_steps": 172, "loss": 1.0414, "lr": 9.184907164529369e-06, "epoch": 1.1613832853025936, "percentage": 58.14, "elapsed_time": "5:18:40", "remaining_time": "3:49:26"}
{"current_steps": 110, "total_steps": 172, "loss": 0.2945, "lr": 7.182674431585703e-06, "epoch": 1.276657060518732, "percentage": 63.95, "elapsed_time": "5:30:13", "remaining_time": "3:06:07"}
{"current_steps": 120, "total_steps": 172, "loss": 0.2875, "lr": 5.297280930072632e-06, "epoch": 1.3919308357348703, "percentage": 69.77, "elapsed_time": "5:41:49", "remaining_time": "2:28:07"}
{"current_steps": 130, "total_steps": 172, "loss": 0.279, "lr": 3.6069171006444882e-06, "epoch": 1.5072046109510087, "percentage": 75.58, "elapsed_time": "5:53:23", "remaining_time": "1:54:10"}
{"current_steps": 140, "total_steps": 172, "loss": 0.2826, "lr": 2.1816851753197023e-06, "epoch": 1.622478386167147, "percentage": 81.4, "elapsed_time": "6:04:51", "remaining_time": "1:23:23"}
{"current_steps": 150, "total_steps": 172, "loss": 0.2821, "lr": 1.0806919199730614e-06, "epoch": 1.7377521613832854, "percentage": 87.21, "elapsed_time": "6:16:27", "remaining_time": "0:55:12"}
{"current_steps": 160, "total_steps": 172, "loss": 0.2813, "lr": 3.4959737730860144e-07, "epoch": 1.8530259365994235, "percentage": 93.02, "elapsed_time": "6:28:05", "remaining_time": "0:29:06"}
{"current_steps": 170, "total_steps": 172, "loss": 0.2795, "lr": 1.872126806633068e-08, "epoch": 1.968299711815562, "percentage": 98.84, "elapsed_time": "6:39:33", "remaining_time": "0:04:42"}
{"current_steps": 172, "total_steps": 172, "eval_loss": 0.2755764126777649, "epoch": 1.9913544668587897, "percentage": 100.0, "elapsed_time": "6:44:35", "remaining_time": "0:00:00"}
{"current_steps": 172, "total_steps": 172, "epoch": 1.9913544668587897, "percentage": 100.0, "elapsed_time": "6:45:09", "remaining_time": "0:00:00"}