{"epoch": 19.0, "global_step": 1653, "max_steps": 1740, "logging_steps": 50, "eval_steps": 50, "save_steps": 50, "train_batch_size": 2, "num_train_epochs": 20, "num_input_tokens_seen": 0, "total_flos": 3.04327780466688e+17, "log_history": [{"loss": 1.4461, "grad_norm": 0.629298746585846, "learning_rate": 2.4390243902439023e-06, "epoch": 18.39080459770115, "step": 1600}, {"eval_loss": 1.472578525543213, "eval_runtime": 1.1085, "eval_samples_per_second": 8.119, "eval_steps_per_second": 2.706, "epoch": 18.39080459770115, "step": 1600}, {"loss": 1.4669, "grad_norm": 0.6036643385887146, "learning_rate": 1.5679442508710803e-06, "epoch": 18.96551724137931, "step": 1650}, {"eval_loss": 1.4724897146224976, "eval_runtime": 1.0953, "eval_samples_per_second": 8.217, "eval_steps_per_second": 2.739, "epoch": 18.96551724137931, "step": 1650}], "best_metric": 1.4655534029006958, "best_model_checkpoint": "./pf-data-use-unsloth-phi-3.5-simpleschema-thinking-prwp-manual-914-train-20epochs-1738770532/checkpoint-1250", "is_local_process_zero": true, "is_world_process_zero": true, "is_hyper_param_search": false, "trial_name": null, "trial_params": null, "stateful_callbacks": {"TrainerControl": {"args": {"should_training_stop": false, "should_epoch_stop": false, "should_save": true, "should_evaluate": false, "should_log": false}, "attributes": {}}}} (Trained with Unsloth)
verified