|
{ |
|
"best_metric": 0.9135991932046025, |
|
"best_model_checkpoint": "../models/eusts/checkpoint-2180", |
|
"epoch": 10.0, |
|
"global_step": 2180, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 2.8726207906295755e-05, |
|
"loss": 1.4053, |
|
"step": 218 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_combined_score": 0.8498445305588846, |
|
"eval_loss": 0.5913795232772827, |
|
"eval_pearson": 0.8576485507627736, |
|
"eval_runtime": 10.4654, |
|
"eval_samples_per_second": 83.227, |
|
"eval_spearmanr": 0.8420405103549957, |
|
"eval_steps_per_second": 10.415, |
|
"step": 218 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 2.553440702781845e-05, |
|
"loss": 0.3881, |
|
"step": 436 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_combined_score": 0.887035736675172, |
|
"eval_loss": 0.447421669960022, |
|
"eval_pearson": 0.8917341241804541, |
|
"eval_runtime": 10.5067, |
|
"eval_samples_per_second": 82.899, |
|
"eval_spearmanr": 0.8823373491698899, |
|
"eval_steps_per_second": 10.374, |
|
"step": 436 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 2.2342606149341143e-05, |
|
"loss": 0.2083, |
|
"step": 654 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_combined_score": 0.8970108216951012, |
|
"eval_loss": 0.4096603989601135, |
|
"eval_pearson": 0.9016467997316473, |
|
"eval_runtime": 10.4817, |
|
"eval_samples_per_second": 83.097, |
|
"eval_spearmanr": 0.8923748436585551, |
|
"eval_steps_per_second": 10.399, |
|
"step": 654 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 1.9150805270863837e-05, |
|
"loss": 0.1393, |
|
"step": 872 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_combined_score": 0.9009673665742599, |
|
"eval_loss": 0.3968064486980438, |
|
"eval_pearson": 0.9046095606853766, |
|
"eval_runtime": 10.448, |
|
"eval_samples_per_second": 83.366, |
|
"eval_spearmanr": 0.8973251724631434, |
|
"eval_steps_per_second": 10.433, |
|
"step": 872 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 1.595900439238653e-05, |
|
"loss": 0.1023, |
|
"step": 1090 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_combined_score": 0.906389648678596, |
|
"eval_loss": 0.38093939423561096, |
|
"eval_pearson": 0.9095917410726173, |
|
"eval_runtime": 10.7338, |
|
"eval_samples_per_second": 81.146, |
|
"eval_spearmanr": 0.9031875562845746, |
|
"eval_steps_per_second": 10.155, |
|
"step": 1090 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 1.2767203513909225e-05, |
|
"loss": 0.0841, |
|
"step": 1308 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_combined_score": 0.9098955778506463, |
|
"eval_loss": 0.37849491834640503, |
|
"eval_pearson": 0.9139073667065271, |
|
"eval_runtime": 10.6077, |
|
"eval_samples_per_second": 82.11, |
|
"eval_spearmanr": 0.9058837889947655, |
|
"eval_steps_per_second": 10.276, |
|
"step": 1308 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 9.575402635431918e-06, |
|
"loss": 0.0664, |
|
"step": 1526 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_combined_score": 0.9111955743924036, |
|
"eval_loss": 0.35929641127586365, |
|
"eval_pearson": 0.9148956072886006, |
|
"eval_runtime": 10.7134, |
|
"eval_samples_per_second": 81.3, |
|
"eval_spearmanr": 0.9074955414962067, |
|
"eval_steps_per_second": 10.174, |
|
"step": 1526 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 6.383601756954612e-06, |
|
"loss": 0.057, |
|
"step": 1744 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_combined_score": 0.9122781067251765, |
|
"eval_loss": 0.3573194146156311, |
|
"eval_pearson": 0.9160432969800479, |
|
"eval_runtime": 10.694, |
|
"eval_samples_per_second": 81.448, |
|
"eval_spearmanr": 0.9085129164703051, |
|
"eval_steps_per_second": 10.193, |
|
"step": 1744 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 3.191800878477306e-06, |
|
"loss": 0.0485, |
|
"step": 1962 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_combined_score": 0.9128873266818468, |
|
"eval_loss": 0.3531445860862732, |
|
"eval_pearson": 0.9165594039106797, |
|
"eval_runtime": 10.7576, |
|
"eval_samples_per_second": 80.966, |
|
"eval_spearmanr": 0.9092152494530139, |
|
"eval_steps_per_second": 10.132, |
|
"step": 1962 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.0449, |
|
"step": 2180 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_combined_score": 0.9135991932046025, |
|
"eval_loss": 0.3487534821033478, |
|
"eval_pearson": 0.917271052630473, |
|
"eval_runtime": 10.8295, |
|
"eval_samples_per_second": 80.428, |
|
"eval_spearmanr": 0.9099273337787319, |
|
"eval_steps_per_second": 10.065, |
|
"step": 2180 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 2180, |
|
"total_flos": 1.834393807540224e+16, |
|
"train_loss": 0.2544048738042149, |
|
"train_runtime": 2592.0512, |
|
"train_samples_per_second": 26.898, |
|
"train_steps_per_second": 0.841 |
|
} |
|
], |
|
"max_steps": 2180, |
|
"num_train_epochs": 10, |
|
"total_flos": 1.834393807540224e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|