amnraw's picture
End of training
89413ec verified
raw
history blame
2.67 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 2.0,
"eval_steps": 500,
"global_step": 200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 349.9459228515625,
"learning_rate": 1e-05,
"loss": 34.1337,
"step": 100
},
{
"epoch": 1.0,
"eval_loss": 32.34307861328125,
"eval_map": 0.1958,
"eval_map_50": 0.3913,
"eval_map_75": 0.181,
"eval_map_car": 0.2673,
"eval_map_large": 0.7775,
"eval_map_medium": 0.6051,
"eval_map_person": 0.1243,
"eval_map_small": 0.1319,
"eval_mar_1": 0.0924,
"eval_mar_10": 0.2465,
"eval_mar_100": 0.2845,
"eval_mar_100_car": 0.3689,
"eval_mar_100_person": 0.2001,
"eval_mar_large": 0.8587,
"eval_mar_medium": 0.7094,
"eval_mar_small": 0.2104,
"eval_runtime": 74.5282,
"eval_samples_per_second": 4.428,
"eval_steps_per_second": 0.564,
"step": 100
},
{
"epoch": 2.0,
"grad_norm": 296.57305908203125,
"learning_rate": 1e-05,
"loss": 28.4514,
"step": 200
},
{
"epoch": 2.0,
"eval_loss": 30.562538146972656,
"eval_map": 0.2089,
"eval_map_50": 0.4081,
"eval_map_75": 0.1963,
"eval_map_car": 0.2797,
"eval_map_large": 0.8115,
"eval_map_medium": 0.6277,
"eval_map_person": 0.1381,
"eval_map_small": 0.1412,
"eval_mar_1": 0.0944,
"eval_mar_10": 0.25,
"eval_mar_100": 0.2879,
"eval_mar_100_car": 0.3722,
"eval_mar_100_person": 0.2036,
"eval_mar_large": 0.8531,
"eval_mar_medium": 0.7147,
"eval_mar_small": 0.2137,
"eval_runtime": 73.4438,
"eval_samples_per_second": 4.493,
"eval_steps_per_second": 0.572,
"step": 200
},
{
"epoch": 2.0,
"step": 200,
"total_flos": 1.787388644818944e+17,
"train_loss": 31.292569580078126,
"train_runtime": 355.6302,
"train_samples_per_second": 8.998,
"train_steps_per_second": 0.562
}
],
"logging_steps": 500,
"max_steps": 200,
"num_input_tokens_seen": 0,
"num_train_epochs": 2,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.787388644818944e+17,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}