xls-r-53-it-italic-speaker / trainer_state.json
alkiskoudounas's picture
Upload with huggingface_hub
beb4f6b verified
{
"best_metric": 0.824220746039857,
"best_model_checkpoint": "wav2vec2-large-xlsr-53-italian-ic-finetuning-hard-speaker/checkpoint-2346",
"epoch": 29.99270072992701,
"global_step": 3060,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.49,
"learning_rate": 1.6013071895424836e-05,
"loss": 4.0662,
"step": 50
},
{
"epoch": 0.97,
"learning_rate": 3.169934640522876e-05,
"loss": 3.9284,
"step": 100
},
{
"epoch": 0.99,
"eval_accuracy": 0.057230454777721,
"eval_loss": 3.828322649002075,
"eval_runtime": 29.2471,
"eval_samples_per_second": 66.913,
"eval_steps_per_second": 2.12,
"step": 102
},
{
"epoch": 1.47,
"learning_rate": 4.803921568627452e-05,
"loss": 3.8316,
"step": 150
},
{
"epoch": 1.95,
"learning_rate": 6.405228758169934e-05,
"loss": 3.6033,
"step": 200
},
{
"epoch": 1.99,
"eval_accuracy": 0.18446601941747573,
"eval_loss": 3.325474262237549,
"eval_runtime": 29.2457,
"eval_samples_per_second": 66.916,
"eval_steps_per_second": 2.12,
"step": 204
},
{
"epoch": 2.45,
"learning_rate": 8.006535947712419e-05,
"loss": 3.2263,
"step": 250
},
{
"epoch": 2.93,
"learning_rate": 9.640522875816994e-05,
"loss": 2.7337,
"step": 300
},
{
"epoch": 2.99,
"eval_accuracy": 0.455799693408278,
"eval_loss": 2.375624895095825,
"eval_runtime": 29.1511,
"eval_samples_per_second": 67.133,
"eval_steps_per_second": 2.127,
"step": 306
},
{
"epoch": 3.43,
"learning_rate": 9.85838779956427e-05,
"loss": 2.2867,
"step": 350
},
{
"epoch": 3.91,
"learning_rate": 9.67683369644154e-05,
"loss": 1.8948,
"step": 400
},
{
"epoch": 3.99,
"eval_accuracy": 0.6075625958099131,
"eval_loss": 1.6275904178619385,
"eval_runtime": 29.219,
"eval_samples_per_second": 66.977,
"eval_steps_per_second": 2.122,
"step": 408
},
{
"epoch": 4.41,
"learning_rate": 9.49527959331881e-05,
"loss": 1.5128,
"step": 450
},
{
"epoch": 4.9,
"learning_rate": 9.313725490196079e-05,
"loss": 1.3163,
"step": 500
},
{
"epoch": 4.99,
"eval_accuracy": 0.7189575881451201,
"eval_loss": 1.2288696765899658,
"eval_runtime": 29.2646,
"eval_samples_per_second": 66.872,
"eval_steps_per_second": 2.119,
"step": 510
},
{
"epoch": 5.39,
"learning_rate": 9.132171387073348e-05,
"loss": 1.1049,
"step": 550
},
{
"epoch": 5.88,
"learning_rate": 8.950617283950617e-05,
"loss": 0.9525,
"step": 600
},
{
"epoch": 5.99,
"eval_accuracy": 0.7567705671946857,
"eval_loss": 1.070212960243225,
"eval_runtime": 29.2153,
"eval_samples_per_second": 66.985,
"eval_steps_per_second": 2.122,
"step": 612
},
{
"epoch": 6.37,
"learning_rate": 8.769063180827887e-05,
"loss": 0.7733,
"step": 650
},
{
"epoch": 6.86,
"learning_rate": 8.587509077705157e-05,
"loss": 0.7063,
"step": 700
},
{
"epoch": 6.99,
"eval_accuracy": 0.7797649463464487,
"eval_loss": 0.9915740489959717,
"eval_runtime": 29.2648,
"eval_samples_per_second": 66.872,
"eval_steps_per_second": 2.119,
"step": 714
},
{
"epoch": 7.35,
"learning_rate": 8.405954974582426e-05,
"loss": 0.6261,
"step": 750
},
{
"epoch": 7.84,
"learning_rate": 8.224400871459695e-05,
"loss": 0.5398,
"step": 800
},
{
"epoch": 7.99,
"eval_accuracy": 0.7797649463464487,
"eval_loss": 0.9585044980049133,
"eval_runtime": 29.2234,
"eval_samples_per_second": 66.967,
"eval_steps_per_second": 2.122,
"step": 816
},
{
"epoch": 8.33,
"learning_rate": 8.042846768336965e-05,
"loss": 0.4993,
"step": 850
},
{
"epoch": 8.82,
"learning_rate": 7.861292665214233e-05,
"loss": 0.4401,
"step": 900
},
{
"epoch": 8.99,
"eval_accuracy": 0.7894736842105263,
"eval_loss": 0.9442699551582336,
"eval_runtime": 29.2708,
"eval_samples_per_second": 66.858,
"eval_steps_per_second": 2.118,
"step": 918
},
{
"epoch": 9.31,
"learning_rate": 7.679738562091505e-05,
"loss": 0.3974,
"step": 950
},
{
"epoch": 9.8,
"learning_rate": 7.498184458968773e-05,
"loss": 0.3377,
"step": 1000
},
{
"epoch": 9.99,
"eval_accuracy": 0.7966274910577414,
"eval_loss": 0.9571655988693237,
"eval_runtime": 29.1828,
"eval_samples_per_second": 67.06,
"eval_steps_per_second": 2.125,
"step": 1020
},
{
"epoch": 10.29,
"learning_rate": 7.316630355846043e-05,
"loss": 0.2958,
"step": 1050
},
{
"epoch": 10.78,
"learning_rate": 7.135076252723311e-05,
"loss": 0.2903,
"step": 1100
},
{
"epoch": 10.99,
"eval_accuracy": 0.8114460909555442,
"eval_loss": 0.9565660357475281,
"eval_runtime": 29.2796,
"eval_samples_per_second": 66.838,
"eval_steps_per_second": 2.118,
"step": 1122
},
{
"epoch": 11.27,
"learning_rate": 6.953522149600581e-05,
"loss": 0.27,
"step": 1150
},
{
"epoch": 11.76,
"learning_rate": 6.771968046477851e-05,
"loss": 0.2313,
"step": 1200
},
{
"epoch": 11.99,
"eval_accuracy": 0.8160449667858968,
"eval_loss": 0.9552507996559143,
"eval_runtime": 29.3904,
"eval_samples_per_second": 66.586,
"eval_steps_per_second": 2.11,
"step": 1224
},
{
"epoch": 12.25,
"learning_rate": 6.590413943355121e-05,
"loss": 0.2222,
"step": 1250
},
{
"epoch": 12.74,
"learning_rate": 6.40885984023239e-05,
"loss": 0.196,
"step": 1300
},
{
"epoch": 12.99,
"eval_accuracy": 0.7976494634644865,
"eval_loss": 1.0041111707687378,
"eval_runtime": 29.2891,
"eval_samples_per_second": 66.817,
"eval_steps_per_second": 2.117,
"step": 1326
},
{
"epoch": 13.23,
"learning_rate": 6.22730573710966e-05,
"loss": 0.186,
"step": 1350
},
{
"epoch": 13.72,
"learning_rate": 6.045751633986928e-05,
"loss": 0.189,
"step": 1400
},
{
"epoch": 13.99,
"eval_accuracy": 0.8109351047521717,
"eval_loss": 1.0098705291748047,
"eval_runtime": 29.5324,
"eval_samples_per_second": 66.266,
"eval_steps_per_second": 2.099,
"step": 1428
},
{
"epoch": 14.21,
"learning_rate": 5.8641975308641984e-05,
"loss": 0.1511,
"step": 1450
},
{
"epoch": 14.7,
"learning_rate": 5.6826434277414676e-05,
"loss": 0.1253,
"step": 1500
},
{
"epoch": 14.99,
"eval_accuracy": 0.8119570771589167,
"eval_loss": 1.030671238899231,
"eval_runtime": 30.8165,
"eval_samples_per_second": 63.505,
"eval_steps_per_second": 2.012,
"step": 1530
},
{
"epoch": 15.19,
"learning_rate": 5.501089324618737e-05,
"loss": 0.1539,
"step": 1550
},
{
"epoch": 15.68,
"learning_rate": 5.319535221496006e-05,
"loss": 0.1114,
"step": 1600
},
{
"epoch": 15.99,
"eval_accuracy": 0.8048032703117016,
"eval_loss": 1.1111302375793457,
"eval_runtime": 30.7697,
"eval_samples_per_second": 63.601,
"eval_steps_per_second": 2.015,
"step": 1632
},
{
"epoch": 16.18,
"learning_rate": 5.137981118373275e-05,
"loss": 0.1331,
"step": 1650
},
{
"epoch": 16.66,
"learning_rate": 4.956427015250545e-05,
"loss": 0.1241,
"step": 1700
},
{
"epoch": 16.99,
"eval_accuracy": 0.8109351047521717,
"eval_loss": 1.0672301054000854,
"eval_runtime": 31.1401,
"eval_samples_per_second": 62.845,
"eval_steps_per_second": 1.991,
"step": 1734
},
{
"epoch": 17.16,
"learning_rate": 4.774872912127814e-05,
"loss": 0.0923,
"step": 1750
},
{
"epoch": 17.64,
"learning_rate": 4.593318809005084e-05,
"loss": 0.1128,
"step": 1800
},
{
"epoch": 17.99,
"eval_accuracy": 0.8119570771589167,
"eval_loss": 1.092710018157959,
"eval_runtime": 31.1388,
"eval_samples_per_second": 62.848,
"eval_steps_per_second": 1.991,
"step": 1836
},
{
"epoch": 18.14,
"learning_rate": 4.411764705882353e-05,
"loss": 0.0897,
"step": 1850
},
{
"epoch": 18.62,
"learning_rate": 4.230210602759623e-05,
"loss": 0.0932,
"step": 1900
},
{
"epoch": 18.99,
"eval_accuracy": 0.8185998978027593,
"eval_loss": 1.0788525342941284,
"eval_runtime": 31.2301,
"eval_samples_per_second": 62.664,
"eval_steps_per_second": 1.985,
"step": 1938
},
{
"epoch": 19.12,
"learning_rate": 4.048656499636892e-05,
"loss": 0.0849,
"step": 1950
},
{
"epoch": 19.6,
"learning_rate": 3.8671023965141615e-05,
"loss": 0.0889,
"step": 2000
},
{
"epoch": 19.99,
"eval_accuracy": 0.8104241185487991,
"eval_loss": 1.153747320175171,
"eval_runtime": 31.9386,
"eval_samples_per_second": 61.274,
"eval_steps_per_second": 1.941,
"step": 2040
},
{
"epoch": 20.1,
"learning_rate": 3.6855482933914306e-05,
"loss": 0.0732,
"step": 2050
},
{
"epoch": 20.58,
"learning_rate": 3.5039941902687e-05,
"loss": 0.0649,
"step": 2100
},
{
"epoch": 20.99,
"eval_accuracy": 0.8088911599386817,
"eval_loss": 1.1140419244766235,
"eval_runtime": 32.7576,
"eval_samples_per_second": 59.742,
"eval_steps_per_second": 1.893,
"step": 2142
},
{
"epoch": 21.08,
"learning_rate": 3.32244008714597e-05,
"loss": 0.061,
"step": 2150
},
{
"epoch": 21.56,
"learning_rate": 3.140885984023239e-05,
"loss": 0.0645,
"step": 2200
},
{
"epoch": 21.99,
"eval_accuracy": 0.8150229943791517,
"eval_loss": 1.133326530456543,
"eval_runtime": 31.5293,
"eval_samples_per_second": 62.069,
"eval_steps_per_second": 1.966,
"step": 2244
},
{
"epoch": 22.06,
"learning_rate": 2.9593318809005084e-05,
"loss": 0.0619,
"step": 2250
},
{
"epoch": 22.55,
"learning_rate": 2.777777777777778e-05,
"loss": 0.0637,
"step": 2300
},
{
"epoch": 22.99,
"eval_accuracy": 0.824220746039857,
"eval_loss": 1.1310803890228271,
"eval_runtime": 29.6669,
"eval_samples_per_second": 65.966,
"eval_steps_per_second": 2.09,
"step": 2346
},
{
"epoch": 23.04,
"learning_rate": 2.596223674655047e-05,
"loss": 0.0453,
"step": 2350
},
{
"epoch": 23.53,
"learning_rate": 2.4183006535947712e-05,
"loss": 0.0767,
"step": 2400
},
{
"epoch": 23.99,
"eval_accuracy": 0.8165559529892693,
"eval_loss": 1.1296130418777466,
"eval_runtime": 29.5997,
"eval_samples_per_second": 66.115,
"eval_steps_per_second": 2.095,
"step": 2448
},
{
"epoch": 24.02,
"learning_rate": 2.2367465504720407e-05,
"loss": 0.0446,
"step": 2450
},
{
"epoch": 24.51,
"learning_rate": 2.0551924473493103e-05,
"loss": 0.0571,
"step": 2500
},
{
"epoch": 24.99,
"learning_rate": 1.877269426289034e-05,
"loss": 0.0457,
"step": 2550
},
{
"epoch": 24.99,
"eval_accuracy": 0.8083801737353091,
"eval_loss": 1.168392539024353,
"eval_runtime": 29.5486,
"eval_samples_per_second": 66.23,
"eval_steps_per_second": 2.098,
"step": 2550
},
{
"epoch": 25.49,
"learning_rate": 1.6957153231663036e-05,
"loss": 0.0424,
"step": 2600
},
{
"epoch": 25.97,
"learning_rate": 1.5141612200435731e-05,
"loss": 0.0405,
"step": 2650
},
{
"epoch": 25.99,
"eval_accuracy": 0.8160449667858968,
"eval_loss": 1.1332188844680786,
"eval_runtime": 29.6263,
"eval_samples_per_second": 66.056,
"eval_steps_per_second": 2.093,
"step": 2652
},
{
"epoch": 26.47,
"learning_rate": 1.3326071169208426e-05,
"loss": 0.0454,
"step": 2700
},
{
"epoch": 26.95,
"learning_rate": 1.151053013798112e-05,
"loss": 0.0362,
"step": 2750
},
{
"epoch": 26.99,
"eval_accuracy": 0.8201328564128768,
"eval_loss": 1.131385087966919,
"eval_runtime": 29.8487,
"eval_samples_per_second": 65.564,
"eval_steps_per_second": 2.077,
"step": 2754
},
{
"epoch": 27.45,
"learning_rate": 9.694989106753813e-06,
"loss": 0.0337,
"step": 2800
},
{
"epoch": 27.93,
"learning_rate": 7.879448075526508e-06,
"loss": 0.0391,
"step": 2850
},
{
"epoch": 27.99,
"eval_accuracy": 0.8211548288196219,
"eval_loss": 1.1564393043518066,
"eval_runtime": 29.8613,
"eval_samples_per_second": 65.536,
"eval_steps_per_second": 2.076,
"step": 2856
},
{
"epoch": 28.43,
"learning_rate": 6.063907044299202e-06,
"loss": 0.0435,
"step": 2900
},
{
"epoch": 28.91,
"learning_rate": 4.2483660130718954e-06,
"loss": 0.0452,
"step": 2950
},
{
"epoch": 28.99,
"eval_accuracy": 0.8221768012263669,
"eval_loss": 1.1484907865524292,
"eval_runtime": 29.975,
"eval_samples_per_second": 65.288,
"eval_steps_per_second": 2.068,
"step": 2958
},
{
"epoch": 29.41,
"learning_rate": 2.43282498184459e-06,
"loss": 0.0484,
"step": 3000
},
{
"epoch": 29.9,
"learning_rate": 6.17283950617284e-07,
"loss": 0.0343,
"step": 3050
},
{
"epoch": 29.99,
"eval_accuracy": 0.8201328564128768,
"eval_loss": 1.1464686393737793,
"eval_runtime": 29.8646,
"eval_samples_per_second": 65.529,
"eval_steps_per_second": 2.076,
"step": 3060
}
],
"max_steps": 3060,
"num_train_epochs": 30,
"total_flos": 1.1930235995944326e+20,
"trial_name": null,
"trial_params": null
}