|
{ |
|
"best_metric": 0.05236489325761795, |
|
"best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/models/google/flan-t5-small-codesearchnet-python/checkpoint-1500", |
|
"epoch": 12.0, |
|
"global_step": 4500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_avg_length": 17.029, |
|
"eval_bleu": 0.0364, |
|
"eval_loss": 0.06356053799390793, |
|
"eval_rouge1": 0.6253, |
|
"eval_rouge2": 0.6076, |
|
"eval_runtime": 194.621, |
|
"eval_samples_per_second": 25.691, |
|
"eval_steps_per_second": 3.211, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"learning_rate": 0.006761715281754732, |
|
"loss": 5.5166, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_avg_length": 16.9996, |
|
"eval_bleu": 0.0351, |
|
"eval_loss": 0.05532339960336685, |
|
"eval_rouge1": 0.6259, |
|
"eval_rouge2": 0.6081, |
|
"eval_runtime": 191.1842, |
|
"eval_samples_per_second": 26.153, |
|
"eval_steps_per_second": 3.269, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 2.67, |
|
"learning_rate": 0.013524587266147137, |
|
"loss": 0.0485, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_avg_length": 16.99, |
|
"eval_bleu": 0.0351, |
|
"eval_loss": 0.05369499325752258, |
|
"eval_rouge1": 0.6258, |
|
"eval_rouge2": 0.6083, |
|
"eval_runtime": 189.3124, |
|
"eval_samples_per_second": 26.411, |
|
"eval_steps_per_second": 3.301, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 0.02029060572385788, |
|
"loss": 0.0409, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_avg_length": 16.9942, |
|
"eval_bleu": 0.0351, |
|
"eval_loss": 0.05236489325761795, |
|
"eval_rouge1": 0.6258, |
|
"eval_rouge2": 0.6082, |
|
"eval_runtime": 189.5235, |
|
"eval_samples_per_second": 26.382, |
|
"eval_steps_per_second": 3.298, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_avg_length": 16.997, |
|
"eval_bleu": 0.0351, |
|
"eval_loss": 0.052440039813518524, |
|
"eval_rouge1": 0.6261, |
|
"eval_rouge2": 0.6086, |
|
"eval_runtime": 188.8356, |
|
"eval_samples_per_second": 26.478, |
|
"eval_steps_per_second": 3.31, |
|
"step": 1875 |
|
}, |
|
{ |
|
"epoch": 5.33, |
|
"learning_rate": 0.027062522247433662, |
|
"loss": 0.0345, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_avg_length": 16.9936, |
|
"eval_bleu": 0.0351, |
|
"eval_loss": 0.052636753767728806, |
|
"eval_rouge1": 0.6258, |
|
"eval_rouge2": 0.6081, |
|
"eval_runtime": 188.807, |
|
"eval_samples_per_second": 26.482, |
|
"eval_steps_per_second": 3.31, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 6.67, |
|
"learning_rate": 0.03384636715054512, |
|
"loss": 0.0303, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_avg_length": 16.991, |
|
"eval_bleu": 0.035, |
|
"eval_loss": 0.0532960519194603, |
|
"eval_rouge1": 0.6254, |
|
"eval_rouge2": 0.6076, |
|
"eval_runtime": 195.9042, |
|
"eval_samples_per_second": 25.523, |
|
"eval_steps_per_second": 3.19, |
|
"step": 2625 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 0.04064999520778656, |
|
"loss": 0.0256, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_avg_length": 16.9964, |
|
"eval_bleu": 0.035, |
|
"eval_loss": 0.05655151233077049, |
|
"eval_rouge1": 0.6257, |
|
"eval_rouge2": 0.6074, |
|
"eval_runtime": 193.7837, |
|
"eval_samples_per_second": 25.802, |
|
"eval_steps_per_second": 3.225, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_avg_length": 16.998, |
|
"eval_bleu": 0.0349, |
|
"eval_loss": 0.05918492376804352, |
|
"eval_rouge1": 0.6253, |
|
"eval_rouge2": 0.6074, |
|
"eval_runtime": 190.3532, |
|
"eval_samples_per_second": 26.267, |
|
"eval_steps_per_second": 3.283, |
|
"step": 3375 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 0.047494322061538696, |
|
"loss": 0.0205, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_avg_length": 16.9932, |
|
"eval_bleu": 0.0351, |
|
"eval_loss": 0.06117509678006172, |
|
"eval_rouge1": 0.6255, |
|
"eval_rouge2": 0.6073, |
|
"eval_runtime": 197.2772, |
|
"eval_samples_per_second": 25.345, |
|
"eval_steps_per_second": 3.168, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 10.67, |
|
"learning_rate": 0.054379865527153015, |
|
"loss": 0.0185, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_avg_length": 16.996, |
|
"eval_bleu": 0.035, |
|
"eval_loss": 0.06389027088880539, |
|
"eval_rouge1": 0.6257, |
|
"eval_rouge2": 0.6079, |
|
"eval_runtime": 194.6757, |
|
"eval_samples_per_second": 25.684, |
|
"eval_steps_per_second": 3.21, |
|
"step": 4125 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 0.0613127239048481, |
|
"loss": 0.0157, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_avg_length": 16.9944, |
|
"eval_bleu": 0.035, |
|
"eval_loss": 0.06984004378318787, |
|
"eval_rouge1": 0.625, |
|
"eval_rouge2": 0.6064, |
|
"eval_runtime": 196.3811, |
|
"eval_samples_per_second": 25.461, |
|
"eval_steps_per_second": 3.183, |
|
"step": 4500 |
|
} |
|
], |
|
"max_steps": 5625, |
|
"num_train_epochs": 15, |
|
"total_flos": 3.346029084672e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|