data-use-unsloth-phi-3.5-simpleschema-thinking-prwp-manual-914-train-20epochs-1738770532-lora
/
special_tokens_map.json

{"epoch": 1.0, "global_step": 87, "max_steps": 1740, "logging_steps": 50, "eval_steps": 50, "save_steps": 50, "train_batch_size": 2, "num_train_epochs": 20, "num_input_tokens_seen": 0, "total_flos": 9222053953536000.0, "log_history": [{"loss": 4.3402, "grad_norm": 0.8734406232833862, "learning_rate": 2.9442508710801396e-05, "epoch": 0.5747126436781609, "step": 50}, {"eval_loss": 3.7241973876953125, "eval_runtime": 1.118, "eval_samples_per_second": 8.05, "eval_steps_per_second": 2.683, "epoch": 0.5747126436781609, "step": 50}], "best_metric": 3.7241973876953125, "best_model_checkpoint": "./pf-data-use-unsloth-phi-3.5-simpleschema-thinking-prwp-manual-914-train-20epochs-1738770532/checkpoint-50", "is_local_process_zero": true, "is_world_process_zero": true, "is_hyper_param_search": false, "trial_name": null, "trial_params": null, "stateful_callbacks": {"TrainerControl": {"args": {"should_training_stop": false, "should_epoch_stop": false, "should_save": true, "should_evaluate": false, "should_log": false}, "attributes": {}}}} (Trained with Unsloth)
5051da4
verified
{
  "bos_token": {
    "content": "<s>",
    "lstrip": false,
    "normalized": false,
    "rstrip": false,
    "single_word": false
  },
  "eos_token": {
    "content": "<|endoftext|>",
    "lstrip": false,
    "normalized": false,
    "rstrip": false,
    "single_word": false
  },
  "pad_token": {
    "content": "<|placeholder6|>",
    "lstrip": false,
    "normalized": false,
    "rstrip": true,
    "single_word": false
  },
  "unk_token": {
    "content": "<unk>",
    "lstrip": false,
    "normalized": false,
    "rstrip": false,
    "single_word": false
  }
}