|
{ |
|
"best_metric": 3.1014273166656494, |
|
"best_model_checkpoint": "../Modelos/bloomz_AEx_SQUAD 16-11-22_14:58:43/checkpoint-1000", |
|
"epoch": 1.0787327266599258, |
|
"global_step": 1000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.05, |
|
"eval_loss": 5.220151424407959, |
|
"eval_runtime": 62.5146, |
|
"eval_samples_per_second": 109.095, |
|
"eval_steps_per_second": 27.274, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_loss": 4.333649158477783, |
|
"eval_runtime": 62.5129, |
|
"eval_samples_per_second": 109.097, |
|
"eval_steps_per_second": 27.274, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_loss": 3.8862874507904053, |
|
"eval_runtime": 62.5283, |
|
"eval_samples_per_second": 109.071, |
|
"eval_steps_per_second": 27.268, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_loss": 3.6269617080688477, |
|
"eval_runtime": 62.5217, |
|
"eval_samples_per_second": 109.082, |
|
"eval_steps_per_second": 27.271, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_loss": 3.50032639503479, |
|
"eval_runtime": 62.5086, |
|
"eval_samples_per_second": 109.105, |
|
"eval_steps_per_second": 27.276, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_loss": 3.3939645290374756, |
|
"eval_runtime": 62.5177, |
|
"eval_samples_per_second": 109.089, |
|
"eval_steps_per_second": 27.272, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_loss": 3.3134140968322754, |
|
"eval_runtime": 62.5154, |
|
"eval_samples_per_second": 109.093, |
|
"eval_steps_per_second": 27.273, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_loss": 3.228942394256592, |
|
"eval_runtime": 62.5039, |
|
"eval_samples_per_second": 109.113, |
|
"eval_steps_per_second": 27.278, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_loss": 3.2036657333374023, |
|
"eval_runtime": 62.5162, |
|
"eval_samples_per_second": 109.092, |
|
"eval_steps_per_second": 27.273, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"learning_rate": 4.108234448040274e-05, |
|
"loss": 3.8523, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_loss": 3.1620962619781494, |
|
"eval_runtime": 62.5012, |
|
"eval_samples_per_second": 109.118, |
|
"eval_steps_per_second": 27.279, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"eval_loss": 3.128020763397217, |
|
"eval_runtime": 62.5236, |
|
"eval_samples_per_second": 109.079, |
|
"eval_steps_per_second": 27.27, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_loss": 3.0899899005889893, |
|
"eval_runtime": 62.5266, |
|
"eval_samples_per_second": 109.074, |
|
"eval_steps_per_second": 27.268, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_loss": 3.073817729949951, |
|
"eval_runtime": 62.5093, |
|
"eval_samples_per_second": 109.104, |
|
"eval_steps_per_second": 27.276, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"eval_loss": 3.0438177585601807, |
|
"eval_runtime": 62.5327, |
|
"eval_samples_per_second": 109.063, |
|
"eval_steps_per_second": 27.266, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"eval_loss": 3.0443129539489746, |
|
"eval_runtime": 62.5242, |
|
"eval_samples_per_second": 109.078, |
|
"eval_steps_per_second": 27.269, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_loss": 3.044921636581421, |
|
"eval_runtime": 62.5248, |
|
"eval_samples_per_second": 109.077, |
|
"eval_steps_per_second": 27.269, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 0.92, |
|
"eval_loss": 3.0547332763671875, |
|
"eval_runtime": 62.5038, |
|
"eval_samples_per_second": 109.113, |
|
"eval_steps_per_second": 27.278, |
|
"step": 850 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"eval_loss": 3.041879415512085, |
|
"eval_runtime": 62.5198, |
|
"eval_samples_per_second": 109.086, |
|
"eval_steps_per_second": 27.271, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"eval_loss": 3.113288640975952, |
|
"eval_runtime": 62.5071, |
|
"eval_samples_per_second": 109.108, |
|
"eval_steps_per_second": 27.277, |
|
"step": 950 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"learning_rate": 3.209277238403452e-05, |
|
"loss": 2.4796, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"eval_loss": 3.1014273166656494, |
|
"eval_runtime": 62.5073, |
|
"eval_samples_per_second": 109.107, |
|
"eval_steps_per_second": 27.277, |
|
"step": 1000 |
|
} |
|
], |
|
"max_steps": 2781, |
|
"num_train_epochs": 3, |
|
"total_flos": 4.377761810061722e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|