SodaXII's picture
Model save
c223834 verified
{
"best_metric": 0.3229925036430359,
"best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/[v4] Training Output/efficientnet-b0_rice-leaf-disease-augmented-v4_fft/checkpoint-1728",
"epoch": 15.0,
"eval_steps": 64,
"global_step": 1920,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.5,
"grad_norm": 1.9023804664611816,
"learning_rate": 7.5e-06,
"loss": 2.0658,
"step": 64
},
{
"epoch": 0.5,
"eval_accuracy": 0.24496644295302014,
"eval_loss": 1.9986859560012817,
"eval_runtime": 5.8944,
"eval_samples_per_second": 50.557,
"eval_steps_per_second": 0.848,
"step": 64
},
{
"epoch": 1.0,
"grad_norm": 1.8835070133209229,
"learning_rate": 1.5e-05,
"loss": 1.9318,
"step": 128
},
{
"epoch": 1.0,
"eval_accuracy": 0.4261744966442953,
"eval_loss": 1.7966947555541992,
"eval_runtime": 6.6797,
"eval_samples_per_second": 44.613,
"eval_steps_per_second": 0.749,
"step": 128
},
{
"epoch": 1.5,
"grad_norm": 1.9900165796279907,
"learning_rate": 2.25e-05,
"loss": 1.6451,
"step": 192
},
{
"epoch": 1.5,
"eval_accuracy": 0.5604026845637584,
"eval_loss": 1.4542900323867798,
"eval_runtime": 5.8004,
"eval_samples_per_second": 51.375,
"eval_steps_per_second": 0.862,
"step": 192
},
{
"epoch": 2.0,
"grad_norm": 2.0631637573242188,
"learning_rate": 3e-05,
"loss": 1.2851,
"step": 256
},
{
"epoch": 2.0,
"eval_accuracy": 0.6845637583892618,
"eval_loss": 1.0677685737609863,
"eval_runtime": 6.7517,
"eval_samples_per_second": 44.137,
"eval_steps_per_second": 0.741,
"step": 256
},
{
"epoch": 2.5,
"grad_norm": 2.0110857486724854,
"learning_rate": 2.9025243640281226e-05,
"loss": 0.9017,
"step": 320
},
{
"epoch": 2.5,
"eval_accuracy": 0.761744966442953,
"eval_loss": 0.8011165261268616,
"eval_runtime": 5.7914,
"eval_samples_per_second": 51.456,
"eval_steps_per_second": 0.863,
"step": 320
},
{
"epoch": 3.0,
"grad_norm": 1.901694416999817,
"learning_rate": 2.6227661222566516e-05,
"loss": 0.6891,
"step": 384
},
{
"epoch": 3.0,
"eval_accuracy": 0.8053691275167785,
"eval_loss": 0.6283528208732605,
"eval_runtime": 5.4903,
"eval_samples_per_second": 54.278,
"eval_steps_per_second": 0.911,
"step": 384
},
{
"epoch": 3.5,
"grad_norm": 2.0307912826538086,
"learning_rate": 2.197084758065653e-05,
"loss": 0.5118,
"step": 448
},
{
"epoch": 3.5,
"eval_accuracy": 0.802013422818792,
"eval_loss": 0.6123932600021362,
"eval_runtime": 6.3097,
"eval_samples_per_second": 47.229,
"eval_steps_per_second": 0.792,
"step": 448
},
{
"epoch": 4.0,
"grad_norm": 2.4103055000305176,
"learning_rate": 1.6808050203829845e-05,
"loss": 0.4458,
"step": 512
},
{
"epoch": 4.0,
"eval_accuracy": 0.8120805369127517,
"eval_loss": 0.6052291393280029,
"eval_runtime": 6.2959,
"eval_samples_per_second": 47.332,
"eval_steps_per_second": 0.794,
"step": 512
},
{
"epoch": 4.5,
"grad_norm": 1.8820128440856934,
"learning_rate": 1.1410265035686632e-05,
"loss": 0.356,
"step": 576
},
{
"epoch": 4.5,
"eval_accuracy": 0.8288590604026845,
"eval_loss": 0.5032140016555786,
"eval_runtime": 5.9496,
"eval_samples_per_second": 50.087,
"eval_steps_per_second": 0.84,
"step": 576
},
{
"epoch": 5.0,
"grad_norm": 1.9764384031295776,
"learning_rate": 6.479028799032664e-06,
"loss": 0.3255,
"step": 640
},
{
"epoch": 5.0,
"eval_accuracy": 0.8523489932885906,
"eval_loss": 0.44292640686035156,
"eval_runtime": 5.3491,
"eval_samples_per_second": 55.71,
"eval_steps_per_second": 0.935,
"step": 640
},
{
"epoch": 5.5,
"grad_norm": 1.9877854585647583,
"learning_rate": 2.6552420115951546e-06,
"loss": 0.294,
"step": 704
},
{
"epoch": 5.5,
"eval_accuracy": 0.8489932885906041,
"eval_loss": 0.48286402225494385,
"eval_runtime": 5.3534,
"eval_samples_per_second": 55.665,
"eval_steps_per_second": 0.934,
"step": 704
},
{
"epoch": 6.0,
"grad_norm": 1.8483781814575195,
"learning_rate": 4.3587273860921985e-07,
"loss": 0.2856,
"step": 768
},
{
"epoch": 6.0,
"eval_accuracy": 0.8389261744966443,
"eval_loss": 0.48628225922584534,
"eval_runtime": 5.4523,
"eval_samples_per_second": 54.656,
"eval_steps_per_second": 0.917,
"step": 768
},
{
"epoch": 6.5,
"grad_norm": 1.8444066047668457,
"learning_rate": 2.989063311147081e-05,
"loss": 0.289,
"step": 832
},
{
"epoch": 6.5,
"eval_accuracy": 0.8523489932885906,
"eval_loss": 0.4306166470050812,
"eval_runtime": 5.5498,
"eval_samples_per_second": 53.696,
"eval_steps_per_second": 0.901,
"step": 832
},
{
"epoch": 7.0,
"grad_norm": 1.8012785911560059,
"learning_rate": 2.8281840384798147e-05,
"loss": 0.2357,
"step": 896
},
{
"epoch": 7.0,
"eval_accuracy": 0.8590604026845637,
"eval_loss": 0.44078949093818665,
"eval_runtime": 5.421,
"eval_samples_per_second": 54.972,
"eval_steps_per_second": 0.922,
"step": 896
},
{
"epoch": 7.5,
"grad_norm": 1.9915043115615845,
"learning_rate": 2.494683987361193e-05,
"loss": 0.183,
"step": 960
},
{
"epoch": 7.5,
"eval_accuracy": 0.8691275167785235,
"eval_loss": 0.38100528717041016,
"eval_runtime": 6.1836,
"eval_samples_per_second": 48.192,
"eval_steps_per_second": 0.809,
"step": 960
},
{
"epoch": 8.0,
"grad_norm": 1.6568807363510132,
"learning_rate": 2.031907330563804e-05,
"loss": 0.1446,
"step": 1024
},
{
"epoch": 8.0,
"eval_accuracy": 0.8624161073825504,
"eval_loss": 0.3679770529270172,
"eval_runtime": 6.3939,
"eval_samples_per_second": 46.607,
"eval_steps_per_second": 0.782,
"step": 1024
},
{
"epoch": 8.5,
"grad_norm": 1.1750797033309937,
"learning_rate": 1.5e-05,
"loss": 0.1094,
"step": 1088
},
{
"epoch": 8.5,
"eval_accuracy": 0.8825503355704698,
"eval_loss": 0.35567012429237366,
"eval_runtime": 5.773,
"eval_samples_per_second": 51.62,
"eval_steps_per_second": 0.866,
"step": 1088
},
{
"epoch": 9.0,
"grad_norm": 1.8476396799087524,
"learning_rate": 9.680926694361966e-06,
"loss": 0.102,
"step": 1152
},
{
"epoch": 9.0,
"eval_accuracy": 0.8825503355704698,
"eval_loss": 0.3554769456386566,
"eval_runtime": 6.2043,
"eval_samples_per_second": 48.031,
"eval_steps_per_second": 0.806,
"step": 1152
},
{
"epoch": 9.5,
"grad_norm": 1.0202888250350952,
"learning_rate": 5.053160126388081e-06,
"loss": 0.0752,
"step": 1216
},
{
"epoch": 9.5,
"eval_accuracy": 0.8825503355704698,
"eval_loss": 0.3513905107975006,
"eval_runtime": 6.2026,
"eval_samples_per_second": 48.044,
"eval_steps_per_second": 0.806,
"step": 1216
},
{
"epoch": 10.0,
"grad_norm": 1.4681854248046875,
"learning_rate": 1.7181596152018497e-06,
"loss": 0.0828,
"step": 1280
},
{
"epoch": 10.0,
"eval_accuracy": 0.8691275167785235,
"eval_loss": 0.4008277654647827,
"eval_runtime": 6.251,
"eval_samples_per_second": 47.673,
"eval_steps_per_second": 0.8,
"step": 1280
},
{
"epoch": 10.5,
"grad_norm": 0.9785635471343994,
"learning_rate": 1.0936688852918875e-07,
"loss": 0.0758,
"step": 1344
},
{
"epoch": 10.5,
"eval_accuracy": 0.8791946308724832,
"eval_loss": 0.35087850689888,
"eval_runtime": 5.9492,
"eval_samples_per_second": 50.091,
"eval_steps_per_second": 0.84,
"step": 1344
},
{
"epoch": 11.0,
"grad_norm": 0.5723533034324646,
"learning_rate": 2.9564127261390784e-05,
"loss": 0.0699,
"step": 1408
},
{
"epoch": 11.0,
"eval_accuracy": 0.889261744966443,
"eval_loss": 0.3736562132835388,
"eval_runtime": 6.3982,
"eval_samples_per_second": 46.575,
"eval_steps_per_second": 0.781,
"step": 1408
},
{
"epoch": 11.5,
"grad_norm": 1.2858341932296753,
"learning_rate": 2.7344757988404852e-05,
"loss": 0.059,
"step": 1472
},
{
"epoch": 11.5,
"eval_accuracy": 0.8859060402684564,
"eval_loss": 0.34882599115371704,
"eval_runtime": 6.2139,
"eval_samples_per_second": 47.957,
"eval_steps_per_second": 0.805,
"step": 1472
},
{
"epoch": 12.0,
"grad_norm": 1.8073585033416748,
"learning_rate": 2.352097120096733e-05,
"loss": 0.0504,
"step": 1536
},
{
"epoch": 12.0,
"eval_accuracy": 0.9026845637583892,
"eval_loss": 0.3544101119041443,
"eval_runtime": 5.7224,
"eval_samples_per_second": 52.076,
"eval_steps_per_second": 0.874,
"step": 1536
},
{
"epoch": 12.5,
"grad_norm": 0.7392011880874634,
"learning_rate": 1.8589734964313355e-05,
"loss": 0.0381,
"step": 1600
},
{
"epoch": 12.5,
"eval_accuracy": 0.8926174496644296,
"eval_loss": 0.38668006658554077,
"eval_runtime": 5.6939,
"eval_samples_per_second": 52.337,
"eval_steps_per_second": 0.878,
"step": 1600
},
{
"epoch": 13.0,
"grad_norm": 0.3402092158794403,
"learning_rate": 1.319194979617016e-05,
"loss": 0.0293,
"step": 1664
},
{
"epoch": 13.0,
"eval_accuracy": 0.889261744966443,
"eval_loss": 0.35926553606987,
"eval_runtime": 5.3061,
"eval_samples_per_second": 56.161,
"eval_steps_per_second": 0.942,
"step": 1664
},
{
"epoch": 13.5,
"grad_norm": 0.38678640127182007,
"learning_rate": 8.029152419343479e-06,
"loss": 0.0257,
"step": 1728
},
{
"epoch": 13.5,
"eval_accuracy": 0.8993288590604027,
"eval_loss": 0.3229925036430359,
"eval_runtime": 5.3086,
"eval_samples_per_second": 56.135,
"eval_steps_per_second": 0.942,
"step": 1728
},
{
"epoch": 14.0,
"grad_norm": 0.9726854562759399,
"learning_rate": 3.772338777433487e-06,
"loss": 0.0258,
"step": 1792
},
{
"epoch": 14.0,
"eval_accuracy": 0.889261744966443,
"eval_loss": 0.4092034101486206,
"eval_runtime": 5.3013,
"eval_samples_per_second": 56.212,
"eval_steps_per_second": 0.943,
"step": 1792
},
{
"epoch": 14.5,
"grad_norm": 2.582404136657715,
"learning_rate": 9.747563597187792e-07,
"loss": 0.0249,
"step": 1856
},
{
"epoch": 14.5,
"eval_accuracy": 0.8859060402684564,
"eval_loss": 0.4290601909160614,
"eval_runtime": 5.279,
"eval_samples_per_second": 56.45,
"eval_steps_per_second": 0.947,
"step": 1856
},
{
"epoch": 15.0,
"grad_norm": 0.6526421904563904,
"learning_rate": 0.0,
"loss": 0.0187,
"step": 1920
},
{
"epoch": 15.0,
"eval_accuracy": 0.8993288590604027,
"eval_loss": 0.3305014669895172,
"eval_runtime": 5.2462,
"eval_samples_per_second": 56.803,
"eval_steps_per_second": 0.953,
"step": 1920
},
{
"epoch": 15.0,
"step": 1920,
"total_flos": 4.4590015828721664e+17,
"train_loss": 0.4125567433113853,
"train_runtime": 3265.3981,
"train_samples_per_second": 37.631,
"train_steps_per_second": 0.588
}
],
"logging_steps": 64,
"max_steps": 1920,
"num_input_tokens_seen": 0,
"num_train_epochs": 15,
"save_steps": 64,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 4.4590015828721664e+17,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}