ucf101_videomae-base / trainer_state.json
jialicheng's picture
Upload folder using huggingface_hub
8b75f28 verified
{
"best_metric": 0.8297674418604651,
"best_model_checkpoint": "video/train/checkpoint/videomae-base/ucf101_42/checkpoint-5700",
"epoch": 19.871751886001675,
"eval_steps": 500,
"global_step": 5960,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.01,
"eval_accuracy": 0.4886511627906977,
"eval_loss": 2.334453582763672,
"eval_runtime": 390.4063,
"eval_samples_per_second": 9.69,
"eval_steps_per_second": 0.154,
"step": 300
},
{
"epoch": 2.01,
"eval_accuracy": 0.6433488372093024,
"eval_loss": 1.4956246614456177,
"eval_runtime": 378.3625,
"eval_samples_per_second": 9.998,
"eval_steps_per_second": 0.159,
"step": 600
},
{
"epoch": 3.01,
"eval_accuracy": 0.7161860465116279,
"eval_loss": 1.1646597385406494,
"eval_runtime": 374.5393,
"eval_samples_per_second": 10.1,
"eval_steps_per_second": 0.16,
"step": 900
},
{
"epoch": 3.34,
"grad_norm": 6.9290690422058105,
"learning_rate": 4.161073825503356e-05,
"loss": 1.5784,
"step": 1000
},
{
"epoch": 4.01,
"eval_accuracy": 0.7028837209302325,
"eval_loss": 1.1531013250350952,
"eval_runtime": 376.3709,
"eval_samples_per_second": 10.051,
"eval_steps_per_second": 0.159,
"step": 1200
},
{
"epoch": 5.01,
"eval_accuracy": 0.7333953488372092,
"eval_loss": 1.0251258611679077,
"eval_runtime": 377.2789,
"eval_samples_per_second": 10.027,
"eval_steps_per_second": 0.159,
"step": 1500
},
{
"epoch": 6.01,
"eval_accuracy": 0.7333023255813953,
"eval_loss": 1.031457781791687,
"eval_runtime": 376.6891,
"eval_samples_per_second": 10.043,
"eval_steps_per_second": 0.159,
"step": 1800
},
{
"epoch": 6.67,
"grad_norm": 7.911869049072266,
"learning_rate": 3.3221476510067115e-05,
"loss": 0.1821,
"step": 2000
},
{
"epoch": 7.01,
"eval_accuracy": 0.7616744186046511,
"eval_loss": 0.9787126779556274,
"eval_runtime": 379.965,
"eval_samples_per_second": 9.956,
"eval_steps_per_second": 0.158,
"step": 2100
},
{
"epoch": 8.01,
"eval_accuracy": 0.7838139534883721,
"eval_loss": 0.8932655453681946,
"eval_runtime": 375.8521,
"eval_samples_per_second": 10.065,
"eval_steps_per_second": 0.16,
"step": 2400
},
{
"epoch": 9.01,
"eval_accuracy": 0.7917209302325582,
"eval_loss": 0.8780561089515686,
"eval_runtime": 373.4872,
"eval_samples_per_second": 10.129,
"eval_steps_per_second": 0.161,
"step": 2700
},
{
"epoch": 10.01,
"grad_norm": 0.12537457048892975,
"learning_rate": 2.4832214765100674e-05,
"loss": 0.0651,
"step": 3000
},
{
"epoch": 10.01,
"eval_accuracy": 0.7909767441860465,
"eval_loss": 0.9051322937011719,
"eval_runtime": 375.6037,
"eval_samples_per_second": 10.072,
"eval_steps_per_second": 0.16,
"step": 3000
},
{
"epoch": 11.01,
"eval_accuracy": 0.790046511627907,
"eval_loss": 0.9593069553375244,
"eval_runtime": 375.7576,
"eval_samples_per_second": 10.068,
"eval_steps_per_second": 0.16,
"step": 3300
},
{
"epoch": 12.01,
"eval_accuracy": 0.8186976744186046,
"eval_loss": 0.8053779602050781,
"eval_runtime": 377.8682,
"eval_samples_per_second": 10.011,
"eval_steps_per_second": 0.159,
"step": 3600
},
{
"epoch": 13.01,
"eval_accuracy": 0.8142325581395349,
"eval_loss": 0.8678916692733765,
"eval_runtime": 376.9615,
"eval_samples_per_second": 10.036,
"eval_steps_per_second": 0.159,
"step": 3900
},
{
"epoch": 13.34,
"grad_norm": 10.020633697509766,
"learning_rate": 1.644295302013423e-05,
"loss": 0.0265,
"step": 4000
},
{
"epoch": 14.01,
"eval_accuracy": 0.8208372093023256,
"eval_loss": 0.8379742503166199,
"eval_runtime": 373.9706,
"eval_samples_per_second": 10.116,
"eval_steps_per_second": 0.16,
"step": 4200
},
{
"epoch": 15.01,
"eval_accuracy": 0.8246511627906977,
"eval_loss": 0.8317446708679199,
"eval_runtime": 375.9164,
"eval_samples_per_second": 10.063,
"eval_steps_per_second": 0.16,
"step": 4500
},
{
"epoch": 16.01,
"eval_accuracy": 0.8249302325581396,
"eval_loss": 0.8027446269989014,
"eval_runtime": 375.7325,
"eval_samples_per_second": 10.068,
"eval_steps_per_second": 0.16,
"step": 4800
},
{
"epoch": 16.67,
"grad_norm": 0.026239760220050812,
"learning_rate": 8.053691275167785e-06,
"loss": 0.0091,
"step": 5000
},
{
"epoch": 17.01,
"eval_accuracy": 0.8254883720930233,
"eval_loss": 0.8239758610725403,
"eval_runtime": 375.8655,
"eval_samples_per_second": 10.065,
"eval_steps_per_second": 0.16,
"step": 5100
},
{
"epoch": 18.01,
"eval_accuracy": 0.8211162790697675,
"eval_loss": 0.8480401039123535,
"eval_runtime": 375.7779,
"eval_samples_per_second": 10.067,
"eval_steps_per_second": 0.16,
"step": 5400
},
{
"epoch": 19.01,
"eval_accuracy": 0.8297674418604651,
"eval_loss": 0.8198431134223938,
"eval_runtime": 372.9411,
"eval_samples_per_second": 10.144,
"eval_steps_per_second": 0.161,
"step": 5700
},
{
"epoch": 19.87,
"eval_accuracy": 0.8282790697674418,
"eval_loss": 0.8315407037734985,
"eval_runtime": 376.729,
"eval_samples_per_second": 10.042,
"eval_steps_per_second": 0.159,
"step": 5960
},
{
"epoch": 19.87,
"step": 5960,
"total_flos": 2.3636640203347614e+20,
"train_loss": 0.3129509675422771,
"train_runtime": 26481.3321,
"train_samples_per_second": 7.203,
"train_steps_per_second": 0.225
}
],
"logging_steps": 1000,
"max_steps": 5960,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"total_flos": 2.3636640203347614e+20,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}