{ "best_metric": 0.8297674418604651, "best_model_checkpoint": "video/train/checkpoint/videomae-base/ucf101_42/checkpoint-5700", "epoch": 19.871751886001675, "eval_steps": 500, "global_step": 5960, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.01, "eval_accuracy": 0.4886511627906977, "eval_loss": 2.334453582763672, "eval_runtime": 390.4063, "eval_samples_per_second": 9.69, "eval_steps_per_second": 0.154, "step": 300 }, { "epoch": 2.01, "eval_accuracy": 0.6433488372093024, "eval_loss": 1.4956246614456177, "eval_runtime": 378.3625, "eval_samples_per_second": 9.998, "eval_steps_per_second": 0.159, "step": 600 }, { "epoch": 3.01, "eval_accuracy": 0.7161860465116279, "eval_loss": 1.1646597385406494, "eval_runtime": 374.5393, "eval_samples_per_second": 10.1, "eval_steps_per_second": 0.16, "step": 900 }, { "epoch": 3.34, "grad_norm": 6.9290690422058105, "learning_rate": 4.161073825503356e-05, "loss": 1.5784, "step": 1000 }, { "epoch": 4.01, "eval_accuracy": 0.7028837209302325, "eval_loss": 1.1531013250350952, "eval_runtime": 376.3709, "eval_samples_per_second": 10.051, "eval_steps_per_second": 0.159, "step": 1200 }, { "epoch": 5.01, "eval_accuracy": 0.7333953488372092, "eval_loss": 1.0251258611679077, "eval_runtime": 377.2789, "eval_samples_per_second": 10.027, "eval_steps_per_second": 0.159, "step": 1500 }, { "epoch": 6.01, "eval_accuracy": 0.7333023255813953, "eval_loss": 1.031457781791687, "eval_runtime": 376.6891, "eval_samples_per_second": 10.043, "eval_steps_per_second": 0.159, "step": 1800 }, { "epoch": 6.67, "grad_norm": 7.911869049072266, "learning_rate": 3.3221476510067115e-05, "loss": 0.1821, "step": 2000 }, { "epoch": 7.01, "eval_accuracy": 0.7616744186046511, "eval_loss": 0.9787126779556274, "eval_runtime": 379.965, "eval_samples_per_second": 9.956, "eval_steps_per_second": 0.158, "step": 2100 }, { "epoch": 8.01, "eval_accuracy": 0.7838139534883721, "eval_loss": 0.8932655453681946, "eval_runtime": 375.8521, "eval_samples_per_second": 10.065, "eval_steps_per_second": 0.16, "step": 2400 }, { "epoch": 9.01, "eval_accuracy": 0.7917209302325582, "eval_loss": 0.8780561089515686, "eval_runtime": 373.4872, "eval_samples_per_second": 10.129, "eval_steps_per_second": 0.161, "step": 2700 }, { "epoch": 10.01, "grad_norm": 0.12537457048892975, "learning_rate": 2.4832214765100674e-05, "loss": 0.0651, "step": 3000 }, { "epoch": 10.01, "eval_accuracy": 0.7909767441860465, "eval_loss": 0.9051322937011719, "eval_runtime": 375.6037, "eval_samples_per_second": 10.072, "eval_steps_per_second": 0.16, "step": 3000 }, { "epoch": 11.01, "eval_accuracy": 0.790046511627907, "eval_loss": 0.9593069553375244, "eval_runtime": 375.7576, "eval_samples_per_second": 10.068, "eval_steps_per_second": 0.16, "step": 3300 }, { "epoch": 12.01, "eval_accuracy": 0.8186976744186046, "eval_loss": 0.8053779602050781, "eval_runtime": 377.8682, "eval_samples_per_second": 10.011, "eval_steps_per_second": 0.159, "step": 3600 }, { "epoch": 13.01, "eval_accuracy": 0.8142325581395349, "eval_loss": 0.8678916692733765, "eval_runtime": 376.9615, "eval_samples_per_second": 10.036, "eval_steps_per_second": 0.159, "step": 3900 }, { "epoch": 13.34, "grad_norm": 10.020633697509766, "learning_rate": 1.644295302013423e-05, "loss": 0.0265, "step": 4000 }, { "epoch": 14.01, "eval_accuracy": 0.8208372093023256, "eval_loss": 0.8379742503166199, "eval_runtime": 373.9706, "eval_samples_per_second": 10.116, "eval_steps_per_second": 0.16, "step": 4200 }, { "epoch": 15.01, "eval_accuracy": 0.8246511627906977, "eval_loss": 0.8317446708679199, "eval_runtime": 375.9164, "eval_samples_per_second": 10.063, "eval_steps_per_second": 0.16, "step": 4500 }, { "epoch": 16.01, "eval_accuracy": 0.8249302325581396, "eval_loss": 0.8027446269989014, "eval_runtime": 375.7325, "eval_samples_per_second": 10.068, "eval_steps_per_second": 0.16, "step": 4800 }, { "epoch": 16.67, "grad_norm": 0.026239760220050812, "learning_rate": 8.053691275167785e-06, "loss": 0.0091, "step": 5000 }, { "epoch": 17.01, "eval_accuracy": 0.8254883720930233, "eval_loss": 0.8239758610725403, "eval_runtime": 375.8655, "eval_samples_per_second": 10.065, "eval_steps_per_second": 0.16, "step": 5100 }, { "epoch": 18.01, "eval_accuracy": 0.8211162790697675, "eval_loss": 0.8480401039123535, "eval_runtime": 375.7779, "eval_samples_per_second": 10.067, "eval_steps_per_second": 0.16, "step": 5400 }, { "epoch": 19.01, "eval_accuracy": 0.8297674418604651, "eval_loss": 0.8198431134223938, "eval_runtime": 372.9411, "eval_samples_per_second": 10.144, "eval_steps_per_second": 0.161, "step": 5700 }, { "epoch": 19.87, "eval_accuracy": 0.8282790697674418, "eval_loss": 0.8315407037734985, "eval_runtime": 376.729, "eval_samples_per_second": 10.042, "eval_steps_per_second": 0.159, "step": 5960 }, { "epoch": 19.87, "step": 5960, "total_flos": 2.3636640203347614e+20, "train_loss": 0.3129509675422771, "train_runtime": 26481.3321, "train_samples_per_second": 7.203, "train_steps_per_second": 0.225 } ], "logging_steps": 1000, "max_steps": 5960, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 500, "total_flos": 2.3636640203347614e+20, "train_batch_size": 8, "trial_name": null, "trial_params": null }