{ "best_metric": 0.014742416329681873, "best_model_checkpoint": "2025-02-05-15-01-55-swin-base-patch4-window7-224/checkpoint-824", "epoch": 10.0, "eval_steps": 500, "global_step": 1030, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "train_accuracy": 0.7412267317668599 }, { "epoch": 1.0, "grad_norm": 7.215459823608398, "learning_rate": 0.0002, "loss": 0.8621, "step": 103 }, { "epoch": 1.0, "eval_accuracy": 0.9283982126242466, "eval_error_rate": 0.0716017873757534, "eval_f1": 0.9232855071576657, "eval_loss": 0.2048601657152176, "eval_precision": 0.9404750520396078, "eval_recall": 0.9219512195121952, "eval_runtime": 9.8053, "eval_samples_per_second": 41.814, "eval_steps_per_second": 1.326, "eval_top1_accuracy": 0.9219512195121952, "step": 103 }, { "epoch": 2.0, "train_accuracy": 0.9104963384865744 }, { "epoch": 2.0, "grad_norm": 5.792384147644043, "learning_rate": 0.00017777777777777779, "loss": 0.3112, "step": 206 }, { "epoch": 2.0, "eval_accuracy": 0.9419247642637625, "eval_error_rate": 0.05807523573623752, "eval_f1": 0.9511052403372374, "eval_loss": 0.19439856708049774, "eval_precision": 0.9578945295266905, "eval_recall": 0.9536585365853658, "eval_runtime": 10.2259, "eval_samples_per_second": 40.094, "eval_steps_per_second": 1.271, "eval_top1_accuracy": 0.9536585365853658, "step": 206 }, { "epoch": 3.0, "train_accuracy": 0.951179820992677 }, { "epoch": 3.0, "grad_norm": 4.394165992736816, "learning_rate": 0.00015555555555555556, "loss": 0.1598, "step": 309 }, { "epoch": 3.0, "eval_accuracy": 0.9626822193906274, "eval_error_rate": 0.03731778060937263, "eval_f1": 0.96096931765473, "eval_loss": 0.16732054948806763, "eval_precision": 0.9635265490590446, "eval_recall": 0.9609756097560975, "eval_runtime": 9.666, "eval_samples_per_second": 42.417, "eval_steps_per_second": 1.345, "eval_top1_accuracy": 0.9609756097560975, "step": 309 }, { "epoch": 4.0, "train_accuracy": 0.9679956604285327 }, { "epoch": 4.0, "grad_norm": 0.13633428514003754, "learning_rate": 0.00013333333333333334, "loss": 0.1019, "step": 412 }, { "epoch": 4.0, "eval_accuracy": 0.9858430180433758, "eval_error_rate": 0.014156981956624182, "eval_f1": 0.9853262142550591, "eval_loss": 0.04716501012444496, "eval_precision": 0.9856189136067184, "eval_recall": 0.9853658536585366, "eval_runtime": 13.7463, "eval_samples_per_second": 29.826, "eval_steps_per_second": 0.946, "eval_top1_accuracy": 0.9853658536585366, "step": 412 }, { "epoch": 5.0, "train_accuracy": 0.9810143748304855 }, { "epoch": 5.0, "grad_norm": 0.03345122188329697, "learning_rate": 0.00011111111111111112, "loss": 0.0779, "step": 515 }, { "epoch": 5.0, "eval_accuracy": 0.9235918788691596, "eval_error_rate": 0.07640812113084039, "eval_f1": 0.9246101559573323, "eval_loss": 0.38690677285194397, "eval_precision": 0.9388475660562225, "eval_recall": 0.926829268292683, "eval_runtime": 10.1996, "eval_samples_per_second": 40.198, "eval_steps_per_second": 1.275, "eval_top1_accuracy": 0.926829268292683, "step": 515 }, { "epoch": 6.0, "train_accuracy": 0.9788445890968267 }, { "epoch": 6.0, "grad_norm": 0.026166679337620735, "learning_rate": 8.888888888888889e-05, "loss": 0.0519, "step": 618 }, { "epoch": 6.0, "eval_accuracy": 0.9851728474268724, "eval_error_rate": 0.014827152573127611, "eval_f1": 0.9852229541018859, "eval_loss": 0.022445783019065857, "eval_precision": 0.9857568348496367, "eval_recall": 0.9853658536585366, "eval_runtime": 10.1817, "eval_samples_per_second": 40.268, "eval_steps_per_second": 1.277, "eval_top1_accuracy": 0.9853658536585366, "step": 618 }, { "epoch": 7.0, "train_accuracy": 0.9902359641985354 }, { "epoch": 7.0, "grad_norm": 0.0006544096395373344, "learning_rate": 6.666666666666667e-05, "loss": 0.0477, "step": 721 }, { "epoch": 7.0, "eval_accuracy": 0.9885326361176093, "eval_error_rate": 0.011467363882390669, "eval_f1": 0.9878881102106918, "eval_loss": 0.04018908366560936, "eval_precision": 0.988658536585366, "eval_recall": 0.9878048780487805, "eval_runtime": 9.8013, "eval_samples_per_second": 41.831, "eval_steps_per_second": 1.326, "eval_top1_accuracy": 0.9878048780487805, "step": 721 }, { "epoch": 8.0, "train_accuracy": 0.9964740981828044 }, { "epoch": 8.0, "grad_norm": 0.007697376888245344, "learning_rate": 4.4444444444444447e-05, "loss": 0.0086, "step": 824 }, { "epoch": 8.0, "eval_accuracy": 0.9947104177873408, "eval_error_rate": 0.005289582212659183, "eval_f1": 0.9951305796069067, "eval_loss": 0.014742416329681873, "eval_precision": 0.9953221447399152, "eval_recall": 0.9951219512195122, "eval_runtime": 9.6919, "eval_samples_per_second": 42.303, "eval_steps_per_second": 1.341, "eval_top1_accuracy": 0.9951219512195122, "step": 824 }, { "epoch": 9.0, "train_accuracy": 0.9981014374830486 }, { "epoch": 9.0, "grad_norm": 0.0019185468554496765, "learning_rate": 2.2222222222222223e-05, "loss": 0.0052, "step": 927 }, { "epoch": 9.0, "eval_accuracy": 0.9947104177873408, "eval_error_rate": 0.005289582212659183, "eval_f1": 0.9951305796069067, "eval_loss": 0.017671354115009308, "eval_precision": 0.9953221447399152, "eval_recall": 0.9951219512195122, "eval_runtime": 9.5073, "eval_samples_per_second": 43.125, "eval_steps_per_second": 1.367, "eval_top1_accuracy": 0.9951219512195122, "step": 927 }, { "epoch": 10.0, "train_accuracy": 0.9989151071331706 }, { "epoch": 10.0, "grad_norm": 0.07999913394451141, "learning_rate": 0.0, "loss": 0.0022, "step": 1030 }, { "epoch": 10.0, "eval_accuracy": 0.9947104177873408, "eval_error_rate": 0.005289582212659183, "eval_f1": 0.9951305796069067, "eval_loss": 0.018023641780018806, "eval_precision": 0.9953221447399152, "eval_recall": 0.9951219512195122, "eval_runtime": 9.6269, "eval_samples_per_second": 42.589, "eval_steps_per_second": 1.35, "eval_top1_accuracy": 0.9951219512195122, "step": 1030 }, { "epoch": 10.0, "step": 1030, "total_flos": 2.5677175620237926e+18, "train_loss": 0.16285478193493721, "train_runtime": 1528.2748, "train_samples_per_second": 21.442, "train_steps_per_second": 0.674 } ], "logging_steps": 500, "max_steps": 1030, "num_input_tokens_seen": 0, "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 3, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 2 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.5677175620237926e+18, "train_batch_size": 32, "trial_name": null, "trial_params": null }