segformer-finetuned-tt-1000-2k / trainer_state.json
Saumya-Mundra's picture
End of training
583ef42 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 160.0,
"eval_steps": 500,
"global_step": 20000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.8,
"grad_norm": 2.1959376335144043,
"learning_rate": 5.7005e-05,
"loss": 0.3719,
"step": 100
},
{
"epoch": 1.0,
"eval_accuracy_no_text": 0.96844593139048,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.96844593139048,
"eval_iou_text": 0.0,
"eval_loss": 0.19860416650772095,
"eval_mean_accuracy": 0.96844593139048,
"eval_mean_iou": 0.48422296569524,
"eval_overall_accuracy": 0.96844593139048,
"eval_runtime": 8.3086,
"eval_samples_per_second": 30.571,
"eval_steps_per_second": 3.851,
"step": 125
},
{
"epoch": 1.6,
"grad_norm": 1.968083381652832,
"learning_rate": 5.401e-05,
"loss": 0.2348,
"step": 200
},
{
"epoch": 2.0,
"eval_accuracy_no_text": 0.9864023804798262,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9864023804798262,
"eval_iou_text": 0.0,
"eval_loss": 0.1335889846086502,
"eval_mean_accuracy": 0.9864023804798262,
"eval_mean_iou": 0.4932011902399131,
"eval_overall_accuracy": 0.9864023804798262,
"eval_runtime": 8.1245,
"eval_samples_per_second": 31.263,
"eval_steps_per_second": 3.939,
"step": 250
},
{
"epoch": 2.4,
"grad_norm": 11.673813819885254,
"learning_rate": 5.1015e-05,
"loss": 0.183,
"step": 300
},
{
"epoch": 3.0,
"eval_accuracy_no_text": 0.9747427016305941,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9747427016305941,
"eval_iou_text": 0.0,
"eval_loss": 0.1268119513988495,
"eval_mean_accuracy": 0.9747427016305941,
"eval_mean_iou": 0.48737135081529703,
"eval_overall_accuracy": 0.9747427016305941,
"eval_runtime": 8.1397,
"eval_samples_per_second": 31.205,
"eval_steps_per_second": 3.931,
"step": 375
},
{
"epoch": 3.2,
"grad_norm": 2.0944621562957764,
"learning_rate": 4.8020000000000004e-05,
"loss": 0.1683,
"step": 400
},
{
"epoch": 4.0,
"grad_norm": 1.8507691621780396,
"learning_rate": 4.5025000000000003e-05,
"loss": 0.1485,
"step": 500
},
{
"epoch": 4.0,
"eval_accuracy_no_text": 0.9801620699547168,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9801620699547168,
"eval_iou_text": 0.0,
"eval_loss": 0.111358642578125,
"eval_mean_accuracy": 0.9801620699547168,
"eval_mean_iou": 0.4900810349773584,
"eval_overall_accuracy": 0.9801620699547168,
"eval_runtime": 8.1347,
"eval_samples_per_second": 31.224,
"eval_steps_per_second": 3.934,
"step": 500
},
{
"epoch": 4.8,
"grad_norm": 0.7507067322731018,
"learning_rate": 4.203e-05,
"loss": 0.1429,
"step": 600
},
{
"epoch": 5.0,
"eval_accuracy_no_text": 0.9756961862525911,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9756961862525911,
"eval_iou_text": 0.0,
"eval_loss": 0.11220362782478333,
"eval_mean_accuracy": 0.9756961862525911,
"eval_mean_iou": 0.48784809312629557,
"eval_overall_accuracy": 0.9756961862525911,
"eval_runtime": 8.1643,
"eval_samples_per_second": 31.111,
"eval_steps_per_second": 3.92,
"step": 625
},
{
"epoch": 5.6,
"grad_norm": 1.759697437286377,
"learning_rate": 3.9035e-05,
"loss": 0.1367,
"step": 700
},
{
"epoch": 6.0,
"eval_accuracy_no_text": 0.9834463870725529,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9834463870725529,
"eval_iou_text": 0.0,
"eval_loss": 0.10746461898088455,
"eval_mean_accuracy": 0.9834463870725529,
"eval_mean_iou": 0.49172319353627647,
"eval_overall_accuracy": 0.9834463870725529,
"eval_runtime": 8.1727,
"eval_samples_per_second": 31.079,
"eval_steps_per_second": 3.915,
"step": 750
},
{
"epoch": 6.4,
"grad_norm": 0.7061517238616943,
"learning_rate": 3.604e-05,
"loss": 0.1333,
"step": 800
},
{
"epoch": 7.0,
"eval_accuracy_no_text": 0.9793181982638223,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9793181982638223,
"eval_iou_text": 0.0,
"eval_loss": 0.10477758198976517,
"eval_mean_accuracy": 0.9793181982638223,
"eval_mean_iou": 0.48965909913191114,
"eval_overall_accuracy": 0.9793181982638223,
"eval_runtime": 8.2604,
"eval_samples_per_second": 30.749,
"eval_steps_per_second": 3.874,
"step": 875
},
{
"epoch": 7.2,
"grad_norm": 0.3624698519706726,
"learning_rate": 3.3045000000000006e-05,
"loss": 0.1299,
"step": 900
},
{
"epoch": 8.0,
"grad_norm": 0.8047678470611572,
"learning_rate": 3.0050000000000002e-05,
"loss": 0.1199,
"step": 1000
},
{
"epoch": 8.0,
"eval_accuracy_no_text": 0.9775670830889114,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9775670830889114,
"eval_iou_text": 0.0,
"eval_loss": 0.10090366005897522,
"eval_mean_accuracy": 0.9775670830889114,
"eval_mean_iou": 0.4887835415444557,
"eval_overall_accuracy": 0.9775670830889114,
"eval_runtime": 8.1621,
"eval_samples_per_second": 31.12,
"eval_steps_per_second": 3.921,
"step": 1000
},
{
"epoch": 8.8,
"grad_norm": 1.3916865587234497,
"learning_rate": 2.7054999999999998e-05,
"loss": 0.1201,
"step": 1100
},
{
"epoch": 9.0,
"eval_accuracy_no_text": 0.9805578030424941,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9805578030424941,
"eval_iou_text": 0.0,
"eval_loss": 0.10001751780509949,
"eval_mean_accuracy": 0.9805578030424941,
"eval_mean_iou": 0.49027890152124703,
"eval_overall_accuracy": 0.9805578030424941,
"eval_runtime": 8.1675,
"eval_samples_per_second": 31.099,
"eval_steps_per_second": 3.918,
"step": 1125
},
{
"epoch": 9.6,
"grad_norm": 0.953816831111908,
"learning_rate": 2.406e-05,
"loss": 0.1111,
"step": 1200
},
{
"epoch": 10.0,
"eval_accuracy_no_text": 0.9807101179946566,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9807101179946566,
"eval_iou_text": 0.0,
"eval_loss": 0.09977567940950394,
"eval_mean_accuracy": 0.9807101179946566,
"eval_mean_iou": 0.4903550589973283,
"eval_overall_accuracy": 0.9807101179946566,
"eval_runtime": 8.2219,
"eval_samples_per_second": 30.893,
"eval_steps_per_second": 3.892,
"step": 1250
},
{
"epoch": 10.4,
"grad_norm": 0.571890652179718,
"learning_rate": 2.1065e-05,
"loss": 0.1128,
"step": 1300
},
{
"epoch": 11.0,
"eval_accuracy_no_text": 0.9791675947156165,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9791675947156165,
"eval_iou_text": 0.0,
"eval_loss": 0.09842447936534882,
"eval_mean_accuracy": 0.9791675947156165,
"eval_mean_iou": 0.48958379735780827,
"eval_overall_accuracy": 0.9791675947156165,
"eval_runtime": 8.6895,
"eval_samples_per_second": 29.231,
"eval_steps_per_second": 3.683,
"step": 1375
},
{
"epoch": 11.2,
"grad_norm": 18.250076293945312,
"learning_rate": 1.807e-05,
"loss": 0.1108,
"step": 1400
},
{
"epoch": 12.0,
"grad_norm": 1.173434853553772,
"learning_rate": 1.5075000000000002e-05,
"loss": 0.1055,
"step": 1500
},
{
"epoch": 12.0,
"eval_accuracy_no_text": 0.9835118690433692,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9835118690433692,
"eval_iou_text": 0.0,
"eval_loss": 0.09405940771102905,
"eval_mean_accuracy": 0.9835118690433692,
"eval_mean_iou": 0.4917559345216846,
"eval_overall_accuracy": 0.9835118690433692,
"eval_runtime": 8.3821,
"eval_samples_per_second": 30.303,
"eval_steps_per_second": 3.818,
"step": 1500
},
{
"epoch": 12.8,
"grad_norm": 0.7602437734603882,
"learning_rate": 1.2079999999999998e-05,
"loss": 0.0988,
"step": 1600
},
{
"epoch": 13.0,
"eval_accuracy_no_text": 0.9814864806149025,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9814864806149025,
"eval_iou_text": 0.0,
"eval_loss": 0.09721452742815018,
"eval_mean_accuracy": 0.9814864806149025,
"eval_mean_iou": 0.49074324030745126,
"eval_overall_accuracy": 0.9814864806149025,
"eval_runtime": 8.2417,
"eval_samples_per_second": 30.819,
"eval_steps_per_second": 3.883,
"step": 1625
},
{
"epoch": 13.6,
"grad_norm": 3.4168713092803955,
"learning_rate": 9.085000000000002e-06,
"loss": 0.0983,
"step": 1700
},
{
"epoch": 14.0,
"eval_accuracy_no_text": 0.9842781460111701,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9842781460111701,
"eval_iou_text": 0.0,
"eval_loss": 0.09473416209220886,
"eval_mean_accuracy": 0.9842781460111701,
"eval_mean_iou": 0.49213907300558507,
"eval_overall_accuracy": 0.9842781460111701,
"eval_runtime": 8.2345,
"eval_samples_per_second": 30.846,
"eval_steps_per_second": 3.886,
"step": 1750
},
{
"epoch": 14.4,
"grad_norm": 4.172765254974365,
"learning_rate": 6.0899999999999984e-06,
"loss": 0.1045,
"step": 1800
},
{
"epoch": 15.0,
"eval_accuracy_no_text": 0.9793696566915354,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9793696566915354,
"eval_iou_text": 0.0,
"eval_loss": 0.09600792080163956,
"eval_mean_accuracy": 0.9793696566915354,
"eval_mean_iou": 0.4896848283457677,
"eval_overall_accuracy": 0.9793696566915354,
"eval_runtime": 8.2507,
"eval_samples_per_second": 30.785,
"eval_steps_per_second": 3.878,
"step": 1875
},
{
"epoch": 15.2,
"grad_norm": 1.797450065612793,
"learning_rate": 3.0950000000000026e-06,
"loss": 0.1047,
"step": 1900
},
{
"epoch": 16.0,
"grad_norm": 1.1411088705062866,
"learning_rate": 1e-07,
"loss": 0.1002,
"step": 2000
},
{
"epoch": 16.0,
"eval_accuracy_no_text": 0.9789534698341376,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9789534698341376,
"eval_iou_text": 0.0,
"eval_loss": 0.09761390835046768,
"eval_mean_accuracy": 0.9789534698341376,
"eval_mean_iou": 0.4894767349170688,
"eval_overall_accuracy": 0.9789534698341376,
"eval_runtime": 8.4956,
"eval_samples_per_second": 29.898,
"eval_steps_per_second": 3.767,
"step": 2000
},
{
"epoch": 16.8,
"grad_norm": 1.944307565689087,
"learning_rate": 5.37105e-05,
"loss": 0.1072,
"step": 2100
},
{
"epoch": 17.0,
"eval_accuracy_no_text": 0.9776347749308564,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9776347749308564,
"eval_iou_text": 0.0,
"eval_loss": 0.10060456395149231,
"eval_mean_accuracy": 0.9776347749308564,
"eval_mean_iou": 0.4888173874654282,
"eval_overall_accuracy": 0.9776347749308564,
"eval_runtime": 8.4116,
"eval_samples_per_second": 30.196,
"eval_steps_per_second": 3.804,
"step": 2125
},
{
"epoch": 17.6,
"grad_norm": 0.7363667488098145,
"learning_rate": 5.3411e-05,
"loss": 0.1046,
"step": 2200
},
{
"epoch": 18.0,
"eval_accuracy_no_text": 0.9800149224455696,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9800149224455696,
"eval_iou_text": 0.0,
"eval_loss": 0.09380830079317093,
"eval_mean_accuracy": 0.9800149224455696,
"eval_mean_iou": 0.4900074612227848,
"eval_overall_accuracy": 0.9800149224455696,
"eval_runtime": 8.0943,
"eval_samples_per_second": 31.38,
"eval_steps_per_second": 3.953,
"step": 2250
},
{
"epoch": 18.4,
"grad_norm": 1.9069602489471436,
"learning_rate": 5.31115e-05,
"loss": 0.1072,
"step": 2300
},
{
"epoch": 19.0,
"eval_accuracy_no_text": 0.9799700770156704,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9799700770156704,
"eval_iou_text": 0.0,
"eval_loss": 0.09618178755044937,
"eval_mean_accuracy": 0.9799700770156704,
"eval_mean_iou": 0.4899850385078352,
"eval_overall_accuracy": 0.9799700770156704,
"eval_runtime": 8.171,
"eval_samples_per_second": 31.086,
"eval_steps_per_second": 3.916,
"step": 2375
},
{
"epoch": 19.2,
"grad_norm": 0.44612982869148254,
"learning_rate": 5.2812e-05,
"loss": 0.1062,
"step": 2400
},
{
"epoch": 20.0,
"grad_norm": 1.044952392578125,
"learning_rate": 5.25125e-05,
"loss": 0.1127,
"step": 2500
},
{
"epoch": 20.0,
"eval_accuracy_no_text": 0.98404203872741,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.98404203872741,
"eval_iou_text": 0.0,
"eval_loss": 0.09183745831251144,
"eval_mean_accuracy": 0.98404203872741,
"eval_mean_iou": 0.492021019363705,
"eval_overall_accuracy": 0.98404203872741,
"eval_runtime": 8.4621,
"eval_samples_per_second": 30.016,
"eval_steps_per_second": 3.782,
"step": 2500
},
{
"epoch": 20.8,
"grad_norm": 3.0239295959472656,
"learning_rate": 5.2213e-05,
"loss": 0.1017,
"step": 2600
},
{
"epoch": 21.0,
"eval_accuracy_no_text": 0.9781973615966435,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9781973615966435,
"eval_iou_text": 0.0,
"eval_loss": 0.09400010854005814,
"eval_mean_accuracy": 0.9781973615966435,
"eval_mean_iou": 0.48909868079832175,
"eval_overall_accuracy": 0.9781973615966435,
"eval_runtime": 8.2162,
"eval_samples_per_second": 30.915,
"eval_steps_per_second": 3.895,
"step": 2625
},
{
"epoch": 21.6,
"grad_norm": 1.0735955238342285,
"learning_rate": 5.1913500000000004e-05,
"loss": 0.0961,
"step": 2700
},
{
"epoch": 22.0,
"eval_accuracy_no_text": 0.9784010685142297,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9784010685142297,
"eval_iou_text": 0.0,
"eval_loss": 0.09638506919145584,
"eval_mean_accuracy": 0.9784010685142297,
"eval_mean_iou": 0.48920053425711485,
"eval_overall_accuracy": 0.9784010685142297,
"eval_runtime": 8.6739,
"eval_samples_per_second": 29.283,
"eval_steps_per_second": 3.689,
"step": 2750
},
{
"epoch": 22.4,
"grad_norm": 0.7935839891433716,
"learning_rate": 5.1614000000000004e-05,
"loss": 0.0951,
"step": 2800
},
{
"epoch": 23.0,
"eval_accuracy_no_text": 0.9820980998348329,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9820980998348329,
"eval_iou_text": 0.0,
"eval_loss": 0.09395471215248108,
"eval_mean_accuracy": 0.9820980998348329,
"eval_mean_iou": 0.49104904991741644,
"eval_overall_accuracy": 0.9820980998348329,
"eval_runtime": 8.6006,
"eval_samples_per_second": 29.533,
"eval_steps_per_second": 3.721,
"step": 2875
},
{
"epoch": 23.2,
"grad_norm": 1.0572441816329956,
"learning_rate": 5.13145e-05,
"loss": 0.101,
"step": 2900
},
{
"epoch": 24.0,
"grad_norm": 0.9966760873794556,
"learning_rate": 5.1015e-05,
"loss": 0.0938,
"step": 3000
},
{
"epoch": 24.0,
"eval_accuracy_no_text": 0.983619405027922,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.983619405027922,
"eval_iou_text": 0.0,
"eval_loss": 0.10053908079862595,
"eval_mean_accuracy": 0.983619405027922,
"eval_mean_iou": 0.491809702513961,
"eval_overall_accuracy": 0.983619405027922,
"eval_runtime": 8.5467,
"eval_samples_per_second": 29.719,
"eval_steps_per_second": 3.744,
"step": 3000
},
{
"epoch": 24.8,
"grad_norm": 1.7212049961090088,
"learning_rate": 5.07155e-05,
"loss": 0.0949,
"step": 3100
},
{
"epoch": 25.0,
"eval_accuracy_no_text": 0.9802790768155358,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9802790768155358,
"eval_iou_text": 0.0,
"eval_loss": 0.10030657052993774,
"eval_mean_accuracy": 0.9802790768155358,
"eval_mean_iou": 0.4901395384077679,
"eval_overall_accuracy": 0.9802790768155358,
"eval_runtime": 8.5434,
"eval_samples_per_second": 29.731,
"eval_steps_per_second": 3.746,
"step": 3125
},
{
"epoch": 25.6,
"grad_norm": 0.9479594230651855,
"learning_rate": 5.0416e-05,
"loss": 0.0949,
"step": 3200
},
{
"epoch": 26.0,
"eval_accuracy_no_text": 0.9815445520404297,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9815445520404297,
"eval_iou_text": 0.0,
"eval_loss": 0.10147000104188919,
"eval_mean_accuracy": 0.9815445520404297,
"eval_mean_iou": 0.49077227602021484,
"eval_overall_accuracy": 0.9815445520404297,
"eval_runtime": 8.3101,
"eval_samples_per_second": 30.565,
"eval_steps_per_second": 3.851,
"step": 3250
},
{
"epoch": 26.4,
"grad_norm": 2.8663785457611084,
"learning_rate": 5.01165e-05,
"loss": 0.0949,
"step": 3300
},
{
"epoch": 27.0,
"eval_accuracy_no_text": 0.9779668869919259,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9779668869919259,
"eval_iou_text": 0.0,
"eval_loss": 0.0970182940363884,
"eval_mean_accuracy": 0.9779668869919259,
"eval_mean_iou": 0.48898344349596295,
"eval_overall_accuracy": 0.9779668869919259,
"eval_runtime": 8.507,
"eval_samples_per_second": 29.858,
"eval_steps_per_second": 3.762,
"step": 3375
},
{
"epoch": 27.2,
"grad_norm": 0.29338690638542175,
"learning_rate": 5.15e-05,
"loss": 0.0977,
"step": 3400
},
{
"epoch": 28.0,
"grad_norm": 0.5164900422096252,
"learning_rate": 5.125e-05,
"loss": 0.0883,
"step": 3500
},
{
"epoch": 28.0,
"eval_accuracy_no_text": 0.9779090481844123,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9779090481844123,
"eval_iou_text": 0.0,
"eval_loss": 0.09671156853437424,
"eval_mean_accuracy": 0.9779090481844123,
"eval_mean_iou": 0.48895452409220613,
"eval_overall_accuracy": 0.9779090481844123,
"eval_runtime": 8.4255,
"eval_samples_per_second": 30.147,
"eval_steps_per_second": 3.798,
"step": 3500
},
{
"epoch": 28.8,
"grad_norm": 0.9270356893539429,
"learning_rate": 5.1e-05,
"loss": 0.0846,
"step": 3600
},
{
"epoch": 29.0,
"eval_accuracy_no_text": 0.984867849291109,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.984867849291109,
"eval_iou_text": 0.0,
"eval_loss": 0.09728837013244629,
"eval_mean_accuracy": 0.984867849291109,
"eval_mean_iou": 0.4924339246455545,
"eval_overall_accuracy": 0.984867849291109,
"eval_runtime": 8.3583,
"eval_samples_per_second": 30.389,
"eval_steps_per_second": 3.829,
"step": 3625
},
{
"epoch": 29.6,
"grad_norm": 54.255714416503906,
"learning_rate": 5.075000000000001e-05,
"loss": 0.0842,
"step": 3700
},
{
"epoch": 30.0,
"eval_accuracy_no_text": 0.9820055344810097,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9820055344810097,
"eval_iou_text": 0.0,
"eval_loss": 0.0946170911192894,
"eval_mean_accuracy": 0.9820055344810097,
"eval_mean_iou": 0.49100276724050484,
"eval_overall_accuracy": 0.9820055344810097,
"eval_runtime": 8.1044,
"eval_samples_per_second": 31.341,
"eval_steps_per_second": 3.948,
"step": 3750
},
{
"epoch": 30.4,
"grad_norm": 0.4858163297176361,
"learning_rate": 5.050000000000001e-05,
"loss": 0.0814,
"step": 3800
},
{
"epoch": 31.0,
"eval_accuracy_no_text": 0.9818622916313758,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9818622916313758,
"eval_iou_text": 0.0,
"eval_loss": 0.09355071932077408,
"eval_mean_accuracy": 0.9818622916313758,
"eval_mean_iou": 0.4909311458156879,
"eval_overall_accuracy": 0.9818622916313758,
"eval_runtime": 8.3948,
"eval_samples_per_second": 30.257,
"eval_steps_per_second": 3.812,
"step": 3875
},
{
"epoch": 31.2,
"grad_norm": 0.7054563760757446,
"learning_rate": 5.0249999999999995e-05,
"loss": 0.082,
"step": 3900
},
{
"epoch": 32.0,
"grad_norm": 1.9450538158416748,
"learning_rate": 5e-05,
"loss": 0.0813,
"step": 4000
},
{
"epoch": 32.0,
"eval_accuracy_no_text": 0.9812941719799806,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9812941719799806,
"eval_iou_text": 0.0,
"eval_loss": 0.09379926323890686,
"eval_mean_accuracy": 0.9812941719799806,
"eval_mean_iou": 0.4906470859899903,
"eval_overall_accuracy": 0.9812941719799806,
"eval_runtime": 8.3235,
"eval_samples_per_second": 30.516,
"eval_steps_per_second": 3.845,
"step": 4000
},
{
"epoch": 32.8,
"grad_norm": 0.48973309993743896,
"learning_rate": 4.975e-05,
"loss": 0.0817,
"step": 4100
},
{
"epoch": 33.0,
"eval_accuracy_no_text": 0.9812250511988094,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9812250511988094,
"eval_iou_text": 0.0,
"eval_loss": 0.09455174952745438,
"eval_mean_accuracy": 0.9812250511988094,
"eval_mean_iou": 0.4906125255994047,
"eval_overall_accuracy": 0.9812250511988094,
"eval_runtime": 8.2561,
"eval_samples_per_second": 30.765,
"eval_steps_per_second": 3.876,
"step": 4125
},
{
"epoch": 33.6,
"grad_norm": 1.3802294731140137,
"learning_rate": 4.95e-05,
"loss": 0.0836,
"step": 4200
},
{
"epoch": 34.0,
"eval_accuracy_no_text": 0.9775148603448678,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9775148603448678,
"eval_iou_text": 0.0,
"eval_loss": 0.0939713567495346,
"eval_mean_accuracy": 0.9775148603448678,
"eval_mean_iou": 0.4887574301724339,
"eval_overall_accuracy": 0.9775148603448678,
"eval_runtime": 8.2502,
"eval_samples_per_second": 30.787,
"eval_steps_per_second": 3.879,
"step": 4250
},
{
"epoch": 34.4,
"grad_norm": 3.26483416557312,
"learning_rate": 4.925e-05,
"loss": 0.0836,
"step": 4300
},
{
"epoch": 35.0,
"eval_accuracy_no_text": 0.9811469413929715,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9811469413929715,
"eval_iou_text": 0.0,
"eval_loss": 0.09151175618171692,
"eval_mean_accuracy": 0.9811469413929715,
"eval_mean_iou": 0.49057347069648577,
"eval_overall_accuracy": 0.9811469413929715,
"eval_runtime": 8.2647,
"eval_samples_per_second": 30.733,
"eval_steps_per_second": 3.872,
"step": 4375
},
{
"epoch": 35.2,
"grad_norm": 1.5455337762832642,
"learning_rate": 4.9e-05,
"loss": 0.0784,
"step": 4400
},
{
"epoch": 36.0,
"grad_norm": 3.040316581726074,
"learning_rate": 4.875e-05,
"loss": 0.0785,
"step": 4500
},
{
"epoch": 36.0,
"eval_accuracy_no_text": 0.9815795942826148,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9815795942826148,
"eval_iou_text": 0.0,
"eval_loss": 0.09513239562511444,
"eval_mean_accuracy": 0.9815795942826148,
"eval_mean_iou": 0.4907897971413074,
"eval_overall_accuracy": 0.9815795942826148,
"eval_runtime": 8.2374,
"eval_samples_per_second": 30.835,
"eval_steps_per_second": 3.885,
"step": 4500
},
{
"epoch": 36.8,
"grad_norm": 2.6754534244537354,
"learning_rate": 4.85e-05,
"loss": 0.0746,
"step": 4600
},
{
"epoch": 37.0,
"eval_accuracy_no_text": 0.9757280549204483,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9757280549204483,
"eval_iou_text": 0.0,
"eval_loss": 0.0951041430234909,
"eval_mean_accuracy": 0.9757280549204483,
"eval_mean_iou": 0.48786402746022417,
"eval_overall_accuracy": 0.9757280549204483,
"eval_runtime": 8.2295,
"eval_samples_per_second": 30.864,
"eval_steps_per_second": 3.888,
"step": 4625
},
{
"epoch": 37.6,
"grad_norm": 0.629497766494751,
"learning_rate": 4.825000000000001e-05,
"loss": 0.0819,
"step": 4700
},
{
"epoch": 38.0,
"eval_accuracy_no_text": 0.9800142910538185,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9800142910538185,
"eval_iou_text": 0.0,
"eval_loss": 0.09518762677907944,
"eval_mean_accuracy": 0.9800142910538185,
"eval_mean_iou": 0.49000714552690927,
"eval_overall_accuracy": 0.9800142910538185,
"eval_runtime": 8.1766,
"eval_samples_per_second": 31.064,
"eval_steps_per_second": 3.914,
"step": 4750
},
{
"epoch": 38.4,
"grad_norm": 0.9247422218322754,
"learning_rate": 4.7999999999999994e-05,
"loss": 0.0731,
"step": 4800
},
{
"epoch": 39.0,
"eval_accuracy_no_text": 0.9797100599232311,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9797100599232311,
"eval_iou_text": 0.0,
"eval_loss": 0.09217899292707443,
"eval_mean_accuracy": 0.9797100599232311,
"eval_mean_iou": 0.48985502996161556,
"eval_overall_accuracy": 0.9797100599232311,
"eval_runtime": 8.1339,
"eval_samples_per_second": 31.227,
"eval_steps_per_second": 3.934,
"step": 4875
},
{
"epoch": 39.2,
"grad_norm": 0.5285217761993408,
"learning_rate": 4.775e-05,
"loss": 0.0826,
"step": 4900
},
{
"epoch": 40.0,
"grad_norm": 0.7555281519889832,
"learning_rate": 4.75e-05,
"loss": 0.0745,
"step": 5000
},
{
"epoch": 40.0,
"eval_accuracy_no_text": 0.9798135915548363,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9798135915548363,
"eval_iou_text": 0.0,
"eval_loss": 0.09387236088514328,
"eval_mean_accuracy": 0.9798135915548363,
"eval_mean_iou": 0.48990679577741814,
"eval_overall_accuracy": 0.9798135915548363,
"eval_runtime": 8.2225,
"eval_samples_per_second": 30.891,
"eval_steps_per_second": 3.892,
"step": 5000
},
{
"epoch": 40.8,
"grad_norm": 0.6379430294036865,
"learning_rate": 4.7249999999999997e-05,
"loss": 0.0755,
"step": 5100
},
{
"epoch": 41.0,
"eval_accuracy_no_text": 0.980224079270902,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.980224079270902,
"eval_iou_text": 0.0,
"eval_loss": 0.094584159553051,
"eval_mean_accuracy": 0.980224079270902,
"eval_mean_iou": 0.490112039635451,
"eval_overall_accuracy": 0.980224079270902,
"eval_runtime": 8.2271,
"eval_samples_per_second": 30.874,
"eval_steps_per_second": 3.89,
"step": 5125
},
{
"epoch": 41.6,
"grad_norm": 0.8154006004333496,
"learning_rate": 4.7000000000000004e-05,
"loss": 0.0692,
"step": 5200
},
{
"epoch": 42.0,
"eval_accuracy_no_text": 0.975735365772303,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.975735365772303,
"eval_iou_text": 0.0,
"eval_loss": 0.09759368002414703,
"eval_mean_accuracy": 0.975735365772303,
"eval_mean_iou": 0.4878676828861515,
"eval_overall_accuracy": 0.975735365772303,
"eval_runtime": 8.4223,
"eval_samples_per_second": 30.158,
"eval_steps_per_second": 3.799,
"step": 5250
},
{
"epoch": 42.4,
"grad_norm": 0.7524943351745605,
"learning_rate": 4.6750000000000005e-05,
"loss": 0.0798,
"step": 5300
},
{
"epoch": 43.0,
"eval_accuracy_no_text": 0.9804404638702271,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9804404638702271,
"eval_iou_text": 0.0,
"eval_loss": 0.09877783805131912,
"eval_mean_accuracy": 0.9804404638702271,
"eval_mean_iou": 0.49022023193511355,
"eval_overall_accuracy": 0.9804404638702271,
"eval_runtime": 8.2237,
"eval_samples_per_second": 30.886,
"eval_steps_per_second": 3.891,
"step": 5375
},
{
"epoch": 43.2,
"grad_norm": 0.3496994972229004,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.072,
"step": 5400
},
{
"epoch": 44.0,
"grad_norm": 1.7848222255706787,
"learning_rate": 4.625e-05,
"loss": 0.076,
"step": 5500
},
{
"epoch": 44.0,
"eval_accuracy_no_text": 0.9797547724285511,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9797547724285511,
"eval_iou_text": 0.0,
"eval_loss": 0.09654530137777328,
"eval_mean_accuracy": 0.9797547724285511,
"eval_mean_iou": 0.48987738621427557,
"eval_overall_accuracy": 0.9797547724285511,
"eval_runtime": 8.1971,
"eval_samples_per_second": 30.987,
"eval_steps_per_second": 3.904,
"step": 5500
},
{
"epoch": 44.8,
"grad_norm": 0.5874524712562561,
"learning_rate": 4.600000000000001e-05,
"loss": 0.0757,
"step": 5600
},
{
"epoch": 45.0,
"eval_accuracy_no_text": 0.9823000122706003,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9823000122706003,
"eval_iou_text": 0.0,
"eval_loss": 0.09140286594629288,
"eval_mean_accuracy": 0.9823000122706003,
"eval_mean_iou": 0.49115000613530013,
"eval_overall_accuracy": 0.9823000122706003,
"eval_runtime": 8.2597,
"eval_samples_per_second": 30.752,
"eval_steps_per_second": 3.874,
"step": 5625
},
{
"epoch": 45.6,
"grad_norm": 0.46248531341552734,
"learning_rate": 4.575000000000001e-05,
"loss": 0.0702,
"step": 5700
},
{
"epoch": 46.0,
"eval_accuracy_no_text": 0.9780766660787523,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9780766660787523,
"eval_iou_text": 0.0,
"eval_loss": 0.09352780878543854,
"eval_mean_accuracy": 0.9780766660787523,
"eval_mean_iou": 0.48903833303937616,
"eval_overall_accuracy": 0.9780766660787523,
"eval_runtime": 8.3183,
"eval_samples_per_second": 30.535,
"eval_steps_per_second": 3.847,
"step": 5750
},
{
"epoch": 46.4,
"grad_norm": 1.1901108026504517,
"learning_rate": 4.55e-05,
"loss": 0.0765,
"step": 5800
},
{
"epoch": 47.0,
"eval_accuracy_no_text": 0.9809388645798449,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9809388645798449,
"eval_iou_text": 0.0,
"eval_loss": 0.09659279137849808,
"eval_mean_accuracy": 0.9809388645798449,
"eval_mean_iou": 0.49046943228992246,
"eval_overall_accuracy": 0.9809388645798449,
"eval_runtime": 8.247,
"eval_samples_per_second": 30.799,
"eval_steps_per_second": 3.88,
"step": 5875
},
{
"epoch": 47.2,
"grad_norm": 0.2969698905944824,
"learning_rate": 4.525000000000001e-05,
"loss": 0.0722,
"step": 5900
},
{
"epoch": 48.0,
"grad_norm": 5.192142486572266,
"learning_rate": 4.5e-05,
"loss": 0.0724,
"step": 6000
},
{
"epoch": 48.0,
"eval_accuracy_no_text": 0.9832674872045554,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9832674872045554,
"eval_iou_text": 0.0,
"eval_loss": 0.09365521371364594,
"eval_mean_accuracy": 0.9832674872045554,
"eval_mean_iou": 0.4916337436022777,
"eval_overall_accuracy": 0.9832674872045554,
"eval_runtime": 8.1901,
"eval_samples_per_second": 31.013,
"eval_steps_per_second": 3.907,
"step": 6000
},
{
"epoch": 48.8,
"grad_norm": 0.8341678380966187,
"learning_rate": 4.4750000000000004e-05,
"loss": 0.0713,
"step": 6100
},
{
"epoch": 49.0,
"eval_accuracy_no_text": 0.9761614388952771,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9761614388952771,
"eval_iou_text": 0.0,
"eval_loss": 0.10168309509754181,
"eval_mean_accuracy": 0.9761614388952771,
"eval_mean_iou": 0.48808071944763853,
"eval_overall_accuracy": 0.9761614388952771,
"eval_runtime": 8.2425,
"eval_samples_per_second": 30.816,
"eval_steps_per_second": 3.882,
"step": 6125
},
{
"epoch": 49.6,
"grad_norm": 1.4235390424728394,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0677,
"step": 6200
},
{
"epoch": 50.0,
"eval_accuracy_no_text": 0.9803571201590842,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9803571201590842,
"eval_iou_text": 0.0,
"eval_loss": 0.09322305768728256,
"eval_mean_accuracy": 0.9803571201590842,
"eval_mean_iou": 0.4901785600795421,
"eval_overall_accuracy": 0.9803571201590842,
"eval_runtime": 8.1322,
"eval_samples_per_second": 31.234,
"eval_steps_per_second": 3.935,
"step": 6250
},
{
"epoch": 50.4,
"grad_norm": 4.009937763214111,
"learning_rate": 4.4250000000000005e-05,
"loss": 0.0715,
"step": 6300
},
{
"epoch": 51.0,
"eval_accuracy_no_text": 0.9781054442501438,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9781054442501438,
"eval_iou_text": 0.0,
"eval_loss": 0.09748787432909012,
"eval_mean_accuracy": 0.9781054442501438,
"eval_mean_iou": 0.4890527221250719,
"eval_overall_accuracy": 0.9781054442501438,
"eval_runtime": 8.3284,
"eval_samples_per_second": 30.498,
"eval_steps_per_second": 3.842,
"step": 6375
},
{
"epoch": 51.2,
"grad_norm": 0.7396467328071594,
"learning_rate": 4.4e-05,
"loss": 0.07,
"step": 6400
},
{
"epoch": 52.0,
"grad_norm": 0.4652855694293976,
"learning_rate": 4.3750000000000006e-05,
"loss": 0.0713,
"step": 6500
},
{
"epoch": 52.0,
"eval_accuracy_no_text": 0.9833075639651767,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9833075639651767,
"eval_iou_text": 0.0,
"eval_loss": 0.09451069682836533,
"eval_mean_accuracy": 0.9833075639651767,
"eval_mean_iou": 0.49165378198258836,
"eval_overall_accuracy": 0.9833075639651767,
"eval_runtime": 8.2755,
"eval_samples_per_second": 30.693,
"eval_steps_per_second": 3.867,
"step": 6500
},
{
"epoch": 52.8,
"grad_norm": 0.32952389121055603,
"learning_rate": 4.35e-05,
"loss": 0.0695,
"step": 6600
},
{
"epoch": 53.0,
"eval_accuracy_no_text": 0.9819285545340948,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9819285545340948,
"eval_iou_text": 0.0,
"eval_loss": 0.09514930099248886,
"eval_mean_accuracy": 0.9819285545340948,
"eval_mean_iou": 0.4909642772670474,
"eval_overall_accuracy": 0.9819285545340948,
"eval_runtime": 8.5513,
"eval_samples_per_second": 29.703,
"eval_steps_per_second": 3.742,
"step": 6625
},
{
"epoch": 53.6,
"grad_norm": 1.479300856590271,
"learning_rate": 4.325e-05,
"loss": 0.0648,
"step": 6700
},
{
"epoch": 54.0,
"eval_accuracy_no_text": 0.9824639248922958,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9824639248922958,
"eval_iou_text": 0.0,
"eval_loss": 0.09646683931350708,
"eval_mean_accuracy": 0.9824639248922958,
"eval_mean_iou": 0.4912319624461479,
"eval_overall_accuracy": 0.9824639248922958,
"eval_runtime": 8.3734,
"eval_samples_per_second": 30.334,
"eval_steps_per_second": 3.822,
"step": 6750
},
{
"epoch": 54.4,
"grad_norm": 0.37164923548698425,
"learning_rate": 4.3e-05,
"loss": 0.0694,
"step": 6800
},
{
"epoch": 55.0,
"eval_accuracy_no_text": 0.9809235284065225,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9809235284065225,
"eval_iou_text": 0.0,
"eval_loss": 0.09463436901569366,
"eval_mean_accuracy": 0.9809235284065225,
"eval_mean_iou": 0.49046176420326126,
"eval_overall_accuracy": 0.9809235284065225,
"eval_runtime": 8.3659,
"eval_samples_per_second": 30.361,
"eval_steps_per_second": 3.825,
"step": 6875
},
{
"epoch": 55.2,
"grad_norm": 0.3387889862060547,
"learning_rate": 4.275e-05,
"loss": 0.0658,
"step": 6900
},
{
"epoch": 56.0,
"grad_norm": 0.8153048157691956,
"learning_rate": 4.25e-05,
"loss": 0.0665,
"step": 7000
},
{
"epoch": 56.0,
"eval_accuracy_no_text": 0.9824437868185507,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9824437868185507,
"eval_iou_text": 0.0,
"eval_loss": 0.1007036343216896,
"eval_mean_accuracy": 0.9824437868185507,
"eval_mean_iou": 0.49122189340927536,
"eval_overall_accuracy": 0.9824437868185507,
"eval_runtime": 8.3927,
"eval_samples_per_second": 30.265,
"eval_steps_per_second": 3.813,
"step": 7000
},
{
"epoch": 56.8,
"grad_norm": 0.8299281001091003,
"learning_rate": 4.225e-05,
"loss": 0.0635,
"step": 7100
},
{
"epoch": 57.0,
"eval_accuracy_no_text": 0.9831196252257952,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9831196252257952,
"eval_iou_text": 0.0,
"eval_loss": 0.09709285199642181,
"eval_mean_accuracy": 0.9831196252257952,
"eval_mean_iou": 0.4915598126128976,
"eval_overall_accuracy": 0.9831196252257952,
"eval_runtime": 8.2632,
"eval_samples_per_second": 30.739,
"eval_steps_per_second": 3.873,
"step": 7125
},
{
"epoch": 57.6,
"grad_norm": 0.6725646257400513,
"learning_rate": 4.2000000000000004e-05,
"loss": 0.0628,
"step": 7200
},
{
"epoch": 58.0,
"eval_accuracy_no_text": 0.9785253031490414,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9785253031490414,
"eval_iou_text": 0.0,
"eval_loss": 0.10017971694469452,
"eval_mean_accuracy": 0.9785253031490414,
"eval_mean_iou": 0.4892626515745207,
"eval_overall_accuracy": 0.9785253031490414,
"eval_runtime": 8.2012,
"eval_samples_per_second": 30.971,
"eval_steps_per_second": 3.902,
"step": 7250
},
{
"epoch": 58.4,
"grad_norm": 0.5249119400978088,
"learning_rate": 4.175e-05,
"loss": 0.0668,
"step": 7300
},
{
"epoch": 59.0,
"eval_accuracy_no_text": 0.9812511708786174,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9812511708786174,
"eval_iou_text": 0.0,
"eval_loss": 0.09598462283611298,
"eval_mean_accuracy": 0.9812511708786174,
"eval_mean_iou": 0.4906255854393087,
"eval_overall_accuracy": 0.9812511708786174,
"eval_runtime": 8.1994,
"eval_samples_per_second": 30.978,
"eval_steps_per_second": 3.903,
"step": 7375
},
{
"epoch": 59.2,
"grad_norm": 0.7958447933197021,
"learning_rate": 4.15e-05,
"loss": 0.0688,
"step": 7400
},
{
"epoch": 60.0,
"grad_norm": 0.3779708743095398,
"learning_rate": 4.125e-05,
"loss": 0.0648,
"step": 7500
},
{
"epoch": 60.0,
"eval_accuracy_no_text": 0.9796383969594832,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9796383969594832,
"eval_iou_text": 0.0,
"eval_loss": 0.0938754603266716,
"eval_mean_accuracy": 0.9796383969594832,
"eval_mean_iou": 0.4898191984797416,
"eval_overall_accuracy": 0.9796383969594832,
"eval_runtime": 8.2596,
"eval_samples_per_second": 30.752,
"eval_steps_per_second": 3.874,
"step": 7500
},
{
"epoch": 60.8,
"grad_norm": 0.30460646748542786,
"learning_rate": 4.1e-05,
"loss": 0.064,
"step": 7600
},
{
"epoch": 61.0,
"eval_accuracy_no_text": 0.9785537157778401,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9785537157778401,
"eval_iou_text": 0.0,
"eval_loss": 0.09466074407100677,
"eval_mean_accuracy": 0.9785537157778401,
"eval_mean_iou": 0.48927685788892006,
"eval_overall_accuracy": 0.9785537157778401,
"eval_runtime": 8.2318,
"eval_samples_per_second": 30.856,
"eval_steps_per_second": 3.887,
"step": 7625
},
{
"epoch": 61.6,
"grad_norm": 1.3763538599014282,
"learning_rate": 4.0749999999999994e-05,
"loss": 0.0636,
"step": 7700
},
{
"epoch": 62.0,
"eval_accuracy_no_text": 0.9788354161922574,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9788354161922574,
"eval_iou_text": 0.0,
"eval_loss": 0.09854825586080551,
"eval_mean_accuracy": 0.9788354161922574,
"eval_mean_iou": 0.4894177080961287,
"eval_overall_accuracy": 0.9788354161922574,
"eval_runtime": 8.1667,
"eval_samples_per_second": 31.102,
"eval_steps_per_second": 3.918,
"step": 7750
},
{
"epoch": 62.4,
"grad_norm": 0.5202354788780212,
"learning_rate": 4.05e-05,
"loss": 0.0653,
"step": 7800
},
{
"epoch": 63.0,
"eval_accuracy_no_text": 0.9812044645046096,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9812044645046096,
"eval_iou_text": 0.0,
"eval_loss": 0.0914328396320343,
"eval_mean_accuracy": 0.9812044645046096,
"eval_mean_iou": 0.4906022322523048,
"eval_overall_accuracy": 0.9812044645046096,
"eval_runtime": 8.3443,
"eval_samples_per_second": 30.44,
"eval_steps_per_second": 3.835,
"step": 7875
},
{
"epoch": 63.2,
"grad_norm": 0.6701187491416931,
"learning_rate": 4.0249999999999996e-05,
"loss": 0.061,
"step": 7900
},
{
"epoch": 64.0,
"grad_norm": 0.389220654964447,
"learning_rate": 3.9999999999999996e-05,
"loss": 0.0594,
"step": 8000
},
{
"epoch": 64.0,
"eval_accuracy_no_text": 0.9782057192295591,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9782057192295591,
"eval_iou_text": 0.0,
"eval_loss": 0.09664972871541977,
"eval_mean_accuracy": 0.9782057192295591,
"eval_mean_iou": 0.48910285961477956,
"eval_overall_accuracy": 0.9782057192295591,
"eval_runtime": 8.3923,
"eval_samples_per_second": 30.266,
"eval_steps_per_second": 3.813,
"step": 8000
},
{
"epoch": 64.8,
"grad_norm": 0.408395379781723,
"learning_rate": 3.975e-05,
"loss": 0.0608,
"step": 8100
},
{
"epoch": 65.0,
"eval_accuracy_no_text": 0.9794022730601506,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9794022730601506,
"eval_iou_text": 0.0,
"eval_loss": 0.09610570222139359,
"eval_mean_accuracy": 0.9794022730601506,
"eval_mean_iou": 0.4897011365300753,
"eval_overall_accuracy": 0.9794022730601506,
"eval_runtime": 8.4338,
"eval_samples_per_second": 30.117,
"eval_steps_per_second": 3.794,
"step": 8125
},
{
"epoch": 65.6,
"grad_norm": 0.7247848510742188,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0625,
"step": 8200
},
{
"epoch": 66.0,
"eval_accuracy_no_text": 0.9813712682359023,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9813712682359023,
"eval_iou_text": 0.0,
"eval_loss": 0.09536296874284744,
"eval_mean_accuracy": 0.9813712682359023,
"eval_mean_iou": 0.49068563411795113,
"eval_overall_accuracy": 0.9813712682359023,
"eval_runtime": 8.3567,
"eval_samples_per_second": 30.395,
"eval_steps_per_second": 3.829,
"step": 8250
},
{
"epoch": 66.4,
"grad_norm": 0.7799036502838135,
"learning_rate": 3.924999999999999e-05,
"loss": 0.0646,
"step": 8300
},
{
"epoch": 67.0,
"eval_accuracy_no_text": 0.9800713489294296,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9800713489294296,
"eval_iou_text": 0.0,
"eval_loss": 0.09814047813415527,
"eval_mean_accuracy": 0.9800713489294296,
"eval_mean_iou": 0.4900356744647148,
"eval_overall_accuracy": 0.9800713489294296,
"eval_runtime": 8.317,
"eval_samples_per_second": 30.54,
"eval_steps_per_second": 3.848,
"step": 8375
},
{
"epoch": 67.2,
"grad_norm": 0.9421979188919067,
"learning_rate": 3.9e-05,
"loss": 0.0616,
"step": 8400
},
{
"epoch": 68.0,
"grad_norm": 0.7759032249450684,
"learning_rate": 3.874999999999999e-05,
"loss": 0.0634,
"step": 8500
},
{
"epoch": 68.0,
"eval_accuracy_no_text": 0.9822642223276573,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9822642223276573,
"eval_iou_text": 0.0,
"eval_loss": 0.09961166232824326,
"eval_mean_accuracy": 0.9822642223276573,
"eval_mean_iou": 0.49113211116382866,
"eval_overall_accuracy": 0.9822642223276573,
"eval_runtime": 8.4898,
"eval_samples_per_second": 29.918,
"eval_steps_per_second": 3.769,
"step": 8500
},
{
"epoch": 68.8,
"grad_norm": 0.9563459753990173,
"learning_rate": 3.850000000000001e-05,
"loss": 0.0611,
"step": 8600
},
{
"epoch": 69.0,
"eval_accuracy_no_text": 0.981046533488977,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.981046533488977,
"eval_iou_text": 0.0,
"eval_loss": 0.10069240629673004,
"eval_mean_accuracy": 0.981046533488977,
"eval_mean_iou": 0.4905232667444885,
"eval_overall_accuracy": 0.981046533488977,
"eval_runtime": 8.3357,
"eval_samples_per_second": 30.472,
"eval_steps_per_second": 3.839,
"step": 8625
},
{
"epoch": 69.6,
"grad_norm": 0.3676619231700897,
"learning_rate": 3.825e-05,
"loss": 0.0599,
"step": 8700
},
{
"epoch": 70.0,
"eval_accuracy_no_text": 0.9792718242012625,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9792718242012625,
"eval_iou_text": 0.0,
"eval_loss": 0.09285294264554977,
"eval_mean_accuracy": 0.9792718242012625,
"eval_mean_iou": 0.48963591210063123,
"eval_overall_accuracy": 0.9792718242012625,
"eval_runtime": 8.2408,
"eval_samples_per_second": 30.822,
"eval_steps_per_second": 3.883,
"step": 8750
},
{
"epoch": 70.4,
"grad_norm": 0.6337301135063171,
"learning_rate": 3.800000000000001e-05,
"loss": 0.0583,
"step": 8800
},
{
"epoch": 71.0,
"eval_accuracy_no_text": 0.9825129740620114,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9825129740620114,
"eval_iou_text": 0.0,
"eval_loss": 0.09883657097816467,
"eval_mean_accuracy": 0.9825129740620114,
"eval_mean_iou": 0.4912564870310057,
"eval_overall_accuracy": 0.9825129740620114,
"eval_runtime": 8.1683,
"eval_samples_per_second": 31.096,
"eval_steps_per_second": 3.918,
"step": 8875
},
{
"epoch": 71.2,
"grad_norm": 1.0939313173294067,
"learning_rate": 3.7749999999999996e-05,
"loss": 0.0618,
"step": 8900
},
{
"epoch": 72.0,
"grad_norm": 0.729832112789154,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0596,
"step": 9000
},
{
"epoch": 72.0,
"eval_accuracy_no_text": 0.9790404523556354,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9790404523556354,
"eval_iou_text": 0.0,
"eval_loss": 0.09549351781606674,
"eval_mean_accuracy": 0.9790404523556354,
"eval_mean_iou": 0.4895202261778177,
"eval_overall_accuracy": 0.9790404523556354,
"eval_runtime": 8.3006,
"eval_samples_per_second": 30.6,
"eval_steps_per_second": 3.855,
"step": 9000
},
{
"epoch": 72.8,
"grad_norm": 0.31644830107688904,
"learning_rate": 3.725e-05,
"loss": 0.0598,
"step": 9100
},
{
"epoch": 73.0,
"eval_accuracy_no_text": 0.9799757761570025,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9799757761570025,
"eval_iou_text": 0.0,
"eval_loss": 0.10248930752277374,
"eval_mean_accuracy": 0.9799757761570025,
"eval_mean_iou": 0.48998788807850124,
"eval_overall_accuracy": 0.9799757761570025,
"eval_runtime": 8.2995,
"eval_samples_per_second": 30.604,
"eval_steps_per_second": 3.856,
"step": 9125
},
{
"epoch": 73.6,
"grad_norm": 0.7597707509994507,
"learning_rate": 3.7000000000000005e-05,
"loss": 0.0623,
"step": 9200
},
{
"epoch": 74.0,
"eval_accuracy_no_text": 0.9836081064386921,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9836081064386921,
"eval_iou_text": 0.0,
"eval_loss": 0.09970316290855408,
"eval_mean_accuracy": 0.9836081064386921,
"eval_mean_iou": 0.49180405321934606,
"eval_overall_accuracy": 0.9836081064386921,
"eval_runtime": 8.2563,
"eval_samples_per_second": 30.764,
"eval_steps_per_second": 3.876,
"step": 9250
},
{
"epoch": 74.4,
"grad_norm": 1.544348955154419,
"learning_rate": 3.675e-05,
"loss": 0.0637,
"step": 9300
},
{
"epoch": 75.0,
"eval_accuracy_no_text": 0.9782330019994349,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9782330019994349,
"eval_iou_text": 0.0,
"eval_loss": 0.09712851047515869,
"eval_mean_accuracy": 0.9782330019994349,
"eval_mean_iou": 0.48911650099971743,
"eval_overall_accuracy": 0.9782330019994349,
"eval_runtime": 8.2372,
"eval_samples_per_second": 30.836,
"eval_steps_per_second": 3.885,
"step": 9375
},
{
"epoch": 75.2,
"grad_norm": 1.103569507598877,
"learning_rate": 3.6500000000000006e-05,
"loss": 0.0577,
"step": 9400
},
{
"epoch": 76.0,
"grad_norm": 3.0431878566741943,
"learning_rate": 3.625e-05,
"loss": 0.0627,
"step": 9500
},
{
"epoch": 76.0,
"eval_accuracy_no_text": 0.9806131328985758,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9806131328985758,
"eval_iou_text": 0.0,
"eval_loss": 0.09336179494857788,
"eval_mean_accuracy": 0.9806131328985758,
"eval_mean_iou": 0.4903065664492879,
"eval_overall_accuracy": 0.9806131328985758,
"eval_runtime": 8.3291,
"eval_samples_per_second": 30.496,
"eval_steps_per_second": 3.842,
"step": 9500
},
{
"epoch": 76.8,
"grad_norm": 0.6158745288848877,
"learning_rate": 3.6e-05,
"loss": 0.0566,
"step": 9600
},
{
"epoch": 77.0,
"eval_accuracy_no_text": 0.9830253983147323,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9830253983147323,
"eval_iou_text": 0.0,
"eval_loss": 0.1015550047159195,
"eval_mean_accuracy": 0.9830253983147323,
"eval_mean_iou": 0.4915126991573662,
"eval_overall_accuracy": 0.9830253983147323,
"eval_runtime": 8.1139,
"eval_samples_per_second": 31.304,
"eval_steps_per_second": 3.944,
"step": 9625
},
{
"epoch": 77.6,
"grad_norm": 0.6829688549041748,
"learning_rate": 3.575e-05,
"loss": 0.0585,
"step": 9700
},
{
"epoch": 78.0,
"eval_accuracy_no_text": 0.9816801849579057,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9816801849579057,
"eval_iou_text": 0.0,
"eval_loss": 0.09153465181589127,
"eval_mean_accuracy": 0.9816801849579057,
"eval_mean_iou": 0.4908400924789528,
"eval_overall_accuracy": 0.9816801849579057,
"eval_runtime": 8.1774,
"eval_samples_per_second": 31.061,
"eval_steps_per_second": 3.913,
"step": 9750
},
{
"epoch": 78.4,
"grad_norm": 0.5731038451194763,
"learning_rate": 3.55e-05,
"loss": 0.0574,
"step": 9800
},
{
"epoch": 79.0,
"eval_accuracy_no_text": 0.981351246471164,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.981351246471164,
"eval_iou_text": 0.0,
"eval_loss": 0.09391193091869354,
"eval_mean_accuracy": 0.981351246471164,
"eval_mean_iou": 0.490675623235582,
"eval_overall_accuracy": 0.981351246471164,
"eval_runtime": 8.219,
"eval_samples_per_second": 30.904,
"eval_steps_per_second": 3.893,
"step": 9875
},
{
"epoch": 79.2,
"grad_norm": 0.2290593832731247,
"learning_rate": 3.5249999999999996e-05,
"loss": 0.0561,
"step": 9900
},
{
"epoch": 80.0,
"grad_norm": 0.826732337474823,
"learning_rate": 3.5000000000000004e-05,
"loss": 0.0579,
"step": 10000
},
{
"epoch": 80.0,
"eval_accuracy_no_text": 0.9797084980594257,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9797084980594257,
"eval_iou_text": 0.0,
"eval_loss": 0.0996052473783493,
"eval_mean_accuracy": 0.9797084980594257,
"eval_mean_iou": 0.48985424902971286,
"eval_overall_accuracy": 0.9797084980594257,
"eval_runtime": 8.2761,
"eval_samples_per_second": 30.691,
"eval_steps_per_second": 3.867,
"step": 10000
},
{
"epoch": 80.8,
"grad_norm": 0.6924729943275452,
"learning_rate": 3.4750000000000004e-05,
"loss": 0.0564,
"step": 10100
},
{
"epoch": 81.0,
"eval_accuracy_no_text": 0.9801340560996555,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9801340560996555,
"eval_iou_text": 0.0,
"eval_loss": 0.09884705394506454,
"eval_mean_accuracy": 0.9801340560996555,
"eval_mean_iou": 0.49006702804982777,
"eval_overall_accuracy": 0.9801340560996555,
"eval_runtime": 8.235,
"eval_samples_per_second": 30.844,
"eval_steps_per_second": 3.886,
"step": 10125
},
{
"epoch": 81.6,
"grad_norm": 0.6362507939338684,
"learning_rate": 3.45e-05,
"loss": 0.0614,
"step": 10200
},
{
"epoch": 82.0,
"eval_accuracy_no_text": 0.9835959936864148,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9835959936864148,
"eval_iou_text": 0.0,
"eval_loss": 0.1010938361287117,
"eval_mean_accuracy": 0.9835959936864148,
"eval_mean_iou": 0.4917979968432074,
"eval_overall_accuracy": 0.9835959936864148,
"eval_runtime": 8.1531,
"eval_samples_per_second": 31.154,
"eval_steps_per_second": 3.925,
"step": 10250
},
{
"epoch": 82.4,
"grad_norm": 0.2358619123697281,
"learning_rate": 3.4250000000000006e-05,
"loss": 0.0556,
"step": 10300
},
{
"epoch": 83.0,
"eval_accuracy_no_text": 0.9816712457799561,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9816712457799561,
"eval_iou_text": 0.0,
"eval_loss": 0.09844139963388443,
"eval_mean_accuracy": 0.9816712457799561,
"eval_mean_iou": 0.49083562288997806,
"eval_overall_accuracy": 0.9816712457799561,
"eval_runtime": 8.4411,
"eval_samples_per_second": 30.091,
"eval_steps_per_second": 3.791,
"step": 10375
},
{
"epoch": 83.2,
"grad_norm": 0.4608982801437378,
"learning_rate": 3.4e-05,
"loss": 0.0585,
"step": 10400
},
{
"epoch": 84.0,
"grad_norm": 0.537953794002533,
"learning_rate": 3.3749999999999994e-05,
"loss": 0.0582,
"step": 10500
},
{
"epoch": 84.0,
"eval_accuracy_no_text": 0.9811251916087039,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9811251916087039,
"eval_iou_text": 0.0,
"eval_loss": 0.0963573008775711,
"eval_mean_accuracy": 0.9811251916087039,
"eval_mean_iou": 0.49056259580435196,
"eval_overall_accuracy": 0.9811251916087039,
"eval_runtime": 8.3426,
"eval_samples_per_second": 30.446,
"eval_steps_per_second": 3.836,
"step": 10500
},
{
"epoch": 84.8,
"grad_norm": 0.3407799303531647,
"learning_rate": 3.35e-05,
"loss": 0.057,
"step": 10600
},
{
"epoch": 85.0,
"eval_accuracy_no_text": 0.9821431280360285,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9821431280360285,
"eval_iou_text": 0.0,
"eval_loss": 0.09560161828994751,
"eval_mean_accuracy": 0.9821431280360285,
"eval_mean_iou": 0.4910715640180143,
"eval_overall_accuracy": 0.9821431280360285,
"eval_runtime": 8.3368,
"eval_samples_per_second": 30.467,
"eval_steps_per_second": 3.838,
"step": 10625
},
{
"epoch": 85.6,
"grad_norm": 0.7103127241134644,
"learning_rate": 3.325e-05,
"loss": 0.0552,
"step": 10700
},
{
"epoch": 86.0,
"eval_accuracy_no_text": 0.9803550099813897,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9803550099813897,
"eval_iou_text": 0.0,
"eval_loss": 0.10003025084733963,
"eval_mean_accuracy": 0.9803550099813897,
"eval_mean_iou": 0.49017750499069485,
"eval_overall_accuracy": 0.9803550099813897,
"eval_runtime": 8.3658,
"eval_samples_per_second": 30.362,
"eval_steps_per_second": 3.825,
"step": 10750
},
{
"epoch": 86.4,
"grad_norm": 0.22427453100681305,
"learning_rate": 3.2999999999999996e-05,
"loss": 0.059,
"step": 10800
},
{
"epoch": 87.0,
"eval_accuracy_no_text": 0.9828363297164279,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9828363297164279,
"eval_iou_text": 0.0,
"eval_loss": 0.09896524995565414,
"eval_mean_accuracy": 0.9828363297164279,
"eval_mean_iou": 0.49141816485821394,
"eval_overall_accuracy": 0.9828363297164279,
"eval_runtime": 8.1925,
"eval_samples_per_second": 31.004,
"eval_steps_per_second": 3.906,
"step": 10875
},
{
"epoch": 87.2,
"grad_norm": 0.7796413898468018,
"learning_rate": 3.2749999999999996e-05,
"loss": 0.0596,
"step": 10900
},
{
"epoch": 88.0,
"grad_norm": 0.44246774911880493,
"learning_rate": 3.25e-05,
"loss": 0.0547,
"step": 11000
},
{
"epoch": 88.0,
"eval_accuracy_no_text": 0.981057084377449,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.981057084377449,
"eval_iou_text": 0.0,
"eval_loss": 0.09589246660470963,
"eval_mean_accuracy": 0.981057084377449,
"eval_mean_iou": 0.4905285421887245,
"eval_overall_accuracy": 0.981057084377449,
"eval_runtime": 8.2104,
"eval_samples_per_second": 30.936,
"eval_steps_per_second": 3.898,
"step": 11000
},
{
"epoch": 88.8,
"grad_norm": 0.19626279175281525,
"learning_rate": 3.225e-05,
"loss": 0.0532,
"step": 11100
},
{
"epoch": 89.0,
"eval_accuracy_no_text": 0.9818968520219614,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9818968520219614,
"eval_iou_text": 0.0,
"eval_loss": 0.09797363728284836,
"eval_mean_accuracy": 0.9818968520219614,
"eval_mean_iou": 0.4909484260109807,
"eval_overall_accuracy": 0.9818968520219614,
"eval_runtime": 8.1435,
"eval_samples_per_second": 31.19,
"eval_steps_per_second": 3.929,
"step": 11125
},
{
"epoch": 89.6,
"grad_norm": 1.401407241821289,
"learning_rate": 3.2e-05,
"loss": 0.0578,
"step": 11200
},
{
"epoch": 90.0,
"eval_accuracy_no_text": 0.9829336138928118,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9829336138928118,
"eval_iou_text": 0.0,
"eval_loss": 0.09540460258722305,
"eval_mean_accuracy": 0.9829336138928118,
"eval_mean_iou": 0.4914668069464059,
"eval_overall_accuracy": 0.9829336138928118,
"eval_runtime": 7.9565,
"eval_samples_per_second": 31.924,
"eval_steps_per_second": 4.022,
"step": 11250
},
{
"epoch": 90.4,
"grad_norm": 0.3004220426082611,
"learning_rate": 3.1750000000000006e-05,
"loss": 0.0552,
"step": 11300
},
{
"epoch": 91.0,
"eval_accuracy_no_text": 0.9817473783326788,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9817473783326788,
"eval_iou_text": 0.0,
"eval_loss": 0.10131113231182098,
"eval_mean_accuracy": 0.9817473783326788,
"eval_mean_iou": 0.4908736891663394,
"eval_overall_accuracy": 0.9817473783326788,
"eval_runtime": 7.9524,
"eval_samples_per_second": 31.94,
"eval_steps_per_second": 4.024,
"step": 11375
},
{
"epoch": 91.2,
"grad_norm": 0.3821699321269989,
"learning_rate": 3.15e-05,
"loss": 0.0555,
"step": 11400
},
{
"epoch": 92.0,
"grad_norm": 0.6809713840484619,
"learning_rate": 3.1249999999999994e-05,
"loss": 0.0584,
"step": 11500
},
{
"epoch": 92.0,
"eval_accuracy_no_text": 0.9802022796399172,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9802022796399172,
"eval_iou_text": 0.0,
"eval_loss": 0.09861049801111221,
"eval_mean_accuracy": 0.9802022796399172,
"eval_mean_iou": 0.4901011398199586,
"eval_overall_accuracy": 0.9802022796399172,
"eval_runtime": 8.4024,
"eval_samples_per_second": 30.23,
"eval_steps_per_second": 3.808,
"step": 11500
},
{
"epoch": 92.8,
"grad_norm": 2.616292953491211,
"learning_rate": 3.1e-05,
"loss": 0.0528,
"step": 11600
},
{
"epoch": 93.0,
"eval_accuracy_no_text": 0.9805875116859397,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9805875116859397,
"eval_iou_text": 0.0,
"eval_loss": 0.10085444152355194,
"eval_mean_accuracy": 0.9805875116859397,
"eval_mean_iou": 0.49029375584296986,
"eval_overall_accuracy": 0.9805875116859397,
"eval_runtime": 8.1295,
"eval_samples_per_second": 31.244,
"eval_steps_per_second": 3.936,
"step": 11625
},
{
"epoch": 93.6,
"grad_norm": 0.6591981053352356,
"learning_rate": 3.075e-05,
"loss": 0.0566,
"step": 11700
},
{
"epoch": 94.0,
"eval_accuracy_no_text": 0.9802413096194776,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9802413096194776,
"eval_iou_text": 0.0,
"eval_loss": 0.098316490650177,
"eval_mean_accuracy": 0.9802413096194776,
"eval_mean_iou": 0.4901206548097388,
"eval_overall_accuracy": 0.9802413096194776,
"eval_runtime": 8.5005,
"eval_samples_per_second": 29.881,
"eval_steps_per_second": 3.764,
"step": 11750
},
{
"epoch": 94.4,
"grad_norm": 1.771093487739563,
"learning_rate": 3.05e-05,
"loss": 0.0541,
"step": 11800
},
{
"epoch": 95.0,
"eval_accuracy_no_text": 0.9805775257269292,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9805775257269292,
"eval_iou_text": 0.0,
"eval_loss": 0.10317344218492508,
"eval_mean_accuracy": 0.9805775257269292,
"eval_mean_iou": 0.4902887628634646,
"eval_overall_accuracy": 0.9805775257269292,
"eval_runtime": 8.3723,
"eval_samples_per_second": 30.338,
"eval_steps_per_second": 3.822,
"step": 11875
},
{
"epoch": 95.2,
"grad_norm": 1.3780484199523926,
"learning_rate": 3.025e-05,
"loss": 0.0534,
"step": 11900
},
{
"epoch": 96.0,
"grad_norm": 0.5944967865943909,
"learning_rate": 3e-05,
"loss": 0.0577,
"step": 12000
},
{
"epoch": 96.0,
"eval_accuracy_no_text": 0.9799943357513698,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9799943357513698,
"eval_iou_text": 0.0,
"eval_loss": 0.10296148806810379,
"eval_mean_accuracy": 0.9799943357513698,
"eval_mean_iou": 0.4899971678756849,
"eval_overall_accuracy": 0.9799943357513698,
"eval_runtime": 8.2647,
"eval_samples_per_second": 30.733,
"eval_steps_per_second": 3.872,
"step": 12000
},
{
"epoch": 96.8,
"grad_norm": 0.368669718503952,
"learning_rate": 2.975e-05,
"loss": 0.0567,
"step": 12100
},
{
"epoch": 97.0,
"eval_accuracy_no_text": 0.9795809070789898,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9795809070789898,
"eval_iou_text": 0.0,
"eval_loss": 0.10392536222934723,
"eval_mean_accuracy": 0.9795809070789898,
"eval_mean_iou": 0.4897904535394949,
"eval_overall_accuracy": 0.9795809070789898,
"eval_runtime": 8.318,
"eval_samples_per_second": 30.536,
"eval_steps_per_second": 3.847,
"step": 12125
},
{
"epoch": 97.6,
"grad_norm": 0.6572363376617432,
"learning_rate": 2.95e-05,
"loss": 0.056,
"step": 12200
},
{
"epoch": 98.0,
"eval_accuracy_no_text": 0.9788773871281321,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9788773871281321,
"eval_iou_text": 0.0,
"eval_loss": 0.10201127082109451,
"eval_mean_accuracy": 0.9788773871281321,
"eval_mean_iou": 0.48943869356406605,
"eval_overall_accuracy": 0.9788773871281321,
"eval_runtime": 8.2133,
"eval_samples_per_second": 30.925,
"eval_steps_per_second": 3.896,
"step": 12250
},
{
"epoch": 98.4,
"grad_norm": 0.1991199553012848,
"learning_rate": 2.9249999999999996e-05,
"loss": 0.0517,
"step": 12300
},
{
"epoch": 99.0,
"eval_accuracy_no_text": 0.981906671825248,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.981906671825248,
"eval_iou_text": 0.0,
"eval_loss": 0.10037293285131454,
"eval_mean_accuracy": 0.981906671825248,
"eval_mean_iou": 0.490953335912624,
"eval_overall_accuracy": 0.981906671825248,
"eval_runtime": 8.1469,
"eval_samples_per_second": 31.178,
"eval_steps_per_second": 3.928,
"step": 12375
},
{
"epoch": 99.2,
"grad_norm": 0.3791349530220032,
"learning_rate": 2.9e-05,
"loss": 0.0562,
"step": 12400
},
{
"epoch": 100.0,
"grad_norm": 0.8666055798530579,
"learning_rate": 2.875e-05,
"loss": 0.051,
"step": 12500
},
{
"epoch": 100.0,
"eval_accuracy_no_text": 0.9826272227378127,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9826272227378127,
"eval_iou_text": 0.0,
"eval_loss": 0.09898550808429718,
"eval_mean_accuracy": 0.9826272227378127,
"eval_mean_iou": 0.49131361136890633,
"eval_overall_accuracy": 0.9826272227378127,
"eval_runtime": 8.2239,
"eval_samples_per_second": 30.886,
"eval_steps_per_second": 3.891,
"step": 12500
},
{
"epoch": 100.8,
"grad_norm": 1.307895541191101,
"learning_rate": 2.8500000000000005e-05,
"loss": 0.0523,
"step": 12600
},
{
"epoch": 101.0,
"eval_accuracy_no_text": 0.9826056889559862,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9826056889559862,
"eval_iou_text": 0.0,
"eval_loss": 0.09835489839315414,
"eval_mean_accuracy": 0.9826056889559862,
"eval_mean_iou": 0.4913028444779931,
"eval_overall_accuracy": 0.9826056889559862,
"eval_runtime": 8.309,
"eval_samples_per_second": 30.569,
"eval_steps_per_second": 3.851,
"step": 12625
},
{
"epoch": 101.6,
"grad_norm": 0.38712045550346375,
"learning_rate": 2.825e-05,
"loss": 0.0521,
"step": 12700
},
{
"epoch": 102.0,
"eval_accuracy_no_text": 0.9799104769574827,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9799104769574827,
"eval_iou_text": 0.0,
"eval_loss": 0.098680280148983,
"eval_mean_accuracy": 0.9799104769574827,
"eval_mean_iou": 0.48995523847874134,
"eval_overall_accuracy": 0.9799104769574827,
"eval_runtime": 8.3754,
"eval_samples_per_second": 30.327,
"eval_steps_per_second": 3.821,
"step": 12750
},
{
"epoch": 102.4,
"grad_norm": 0.2037675976753235,
"learning_rate": 2.7999999999999996e-05,
"loss": 0.0518,
"step": 12800
},
{
"epoch": 103.0,
"eval_accuracy_no_text": 0.9818977160317262,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9818977160317262,
"eval_iou_text": 0.0,
"eval_loss": 0.10650473833084106,
"eval_mean_accuracy": 0.9818977160317262,
"eval_mean_iou": 0.4909488580158631,
"eval_overall_accuracy": 0.9818977160317262,
"eval_runtime": 8.2263,
"eval_samples_per_second": 30.876,
"eval_steps_per_second": 3.89,
"step": 12875
},
{
"epoch": 103.2,
"grad_norm": 0.6227338314056396,
"learning_rate": 2.7750000000000004e-05,
"loss": 0.0551,
"step": 12900
},
{
"epoch": 104.0,
"grad_norm": 0.6191376447677612,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0521,
"step": 13000
},
{
"epoch": 104.0,
"eval_accuracy_no_text": 0.9808840830376523,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9808840830376523,
"eval_iou_text": 0.0,
"eval_loss": 0.10519281029701233,
"eval_mean_accuracy": 0.9808840830376523,
"eval_mean_iou": 0.49044204151882614,
"eval_overall_accuracy": 0.9808840830376523,
"eval_runtime": 8.3514,
"eval_samples_per_second": 30.414,
"eval_steps_per_second": 3.832,
"step": 13000
},
{
"epoch": 104.8,
"grad_norm": 0.30404117703437805,
"learning_rate": 2.725e-05,
"loss": 0.0556,
"step": 13100
},
{
"epoch": 105.0,
"eval_accuracy_no_text": 0.9817842316722551,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9817842316722551,
"eval_iou_text": 0.0,
"eval_loss": 0.10063216090202332,
"eval_mean_accuracy": 0.9817842316722551,
"eval_mean_iou": 0.4908921158361276,
"eval_overall_accuracy": 0.9817842316722551,
"eval_runtime": 8.2778,
"eval_samples_per_second": 30.685,
"eval_steps_per_second": 3.866,
"step": 13125
},
{
"epoch": 105.6,
"grad_norm": 0.7706215977668762,
"learning_rate": 2.7e-05,
"loss": 0.0544,
"step": 13200
},
{
"epoch": 106.0,
"eval_accuracy_no_text": 0.9808936702229253,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9808936702229253,
"eval_iou_text": 0.0,
"eval_loss": 0.10449624061584473,
"eval_mean_accuracy": 0.9808936702229253,
"eval_mean_iou": 0.49044683511146264,
"eval_overall_accuracy": 0.9808936702229253,
"eval_runtime": 8.4473,
"eval_samples_per_second": 30.069,
"eval_steps_per_second": 3.788,
"step": 13250
},
{
"epoch": 106.4,
"grad_norm": 0.3159944713115692,
"learning_rate": 2.675e-05,
"loss": 0.0549,
"step": 13300
},
{
"epoch": 107.0,
"eval_accuracy_no_text": 0.9823117428647125,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9823117428647125,
"eval_iou_text": 0.0,
"eval_loss": 0.101432666182518,
"eval_mean_accuracy": 0.9823117428647125,
"eval_mean_iou": 0.49115587143235623,
"eval_overall_accuracy": 0.9823117428647125,
"eval_runtime": 8.2997,
"eval_samples_per_second": 30.604,
"eval_steps_per_second": 3.856,
"step": 13375
},
{
"epoch": 107.2,
"grad_norm": 0.7384445667266846,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0506,
"step": 13400
},
{
"epoch": 108.0,
"grad_norm": 1.998416543006897,
"learning_rate": 2.625e-05,
"loss": 0.054,
"step": 13500
},
{
"epoch": 108.0,
"eval_accuracy_no_text": 0.9808719370542301,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9808719370542301,
"eval_iou_text": 0.0,
"eval_loss": 0.10262825340032578,
"eval_mean_accuracy": 0.9808719370542301,
"eval_mean_iou": 0.4904359685271151,
"eval_overall_accuracy": 0.9808719370542301,
"eval_runtime": 8.2241,
"eval_samples_per_second": 30.885,
"eval_steps_per_second": 3.891,
"step": 13500
},
{
"epoch": 108.8,
"grad_norm": 0.29045435786247253,
"learning_rate": 2.5999999999999995e-05,
"loss": 0.0526,
"step": 13600
},
{
"epoch": 109.0,
"eval_accuracy_no_text": 0.9836949560356109,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9836949560356109,
"eval_iou_text": 0.0,
"eval_loss": 0.10518956929445267,
"eval_mean_accuracy": 0.9836949560356109,
"eval_mean_iou": 0.49184747801780543,
"eval_overall_accuracy": 0.9836949560356109,
"eval_runtime": 8.301,
"eval_samples_per_second": 30.599,
"eval_steps_per_second": 3.855,
"step": 13625
},
{
"epoch": 109.6,
"grad_norm": 0.6301660537719727,
"learning_rate": 2.575e-05,
"loss": 0.0524,
"step": 13700
},
{
"epoch": 110.0,
"eval_accuracy_no_text": 0.9830132357157378,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9830132357157378,
"eval_iou_text": 0.0,
"eval_loss": 0.09869378805160522,
"eval_mean_accuracy": 0.9830132357157378,
"eval_mean_iou": 0.4915066178578689,
"eval_overall_accuracy": 0.9830132357157378,
"eval_runtime": 8.2194,
"eval_samples_per_second": 30.903,
"eval_steps_per_second": 3.893,
"step": 13750
},
{
"epoch": 110.4,
"grad_norm": 5.493782043457031,
"learning_rate": 2.55e-05,
"loss": 0.0487,
"step": 13800
},
{
"epoch": 111.0,
"eval_accuracy_no_text": 0.9800823152072116,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9800823152072116,
"eval_iou_text": 0.0,
"eval_loss": 0.10276078432798386,
"eval_mean_accuracy": 0.9800823152072116,
"eval_mean_iou": 0.4900411576036058,
"eval_overall_accuracy": 0.9800823152072116,
"eval_runtime": 11.9277,
"eval_samples_per_second": 21.295,
"eval_steps_per_second": 2.683,
"step": 13875
},
{
"epoch": 111.2,
"grad_norm": 0.2871710956096649,
"learning_rate": 2.5250000000000004e-05,
"loss": 0.0536,
"step": 13900
},
{
"epoch": 112.0,
"grad_norm": 0.9292570948600769,
"learning_rate": 2.5000000000000005e-05,
"loss": 0.054,
"step": 14000
},
{
"epoch": 112.0,
"eval_accuracy_no_text": 0.9829168155491185,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9829168155491185,
"eval_iou_text": 0.0,
"eval_loss": 0.1070096418261528,
"eval_mean_accuracy": 0.9829168155491185,
"eval_mean_iou": 0.49145840777455924,
"eval_overall_accuracy": 0.9829168155491185,
"eval_runtime": 8.2923,
"eval_samples_per_second": 30.631,
"eval_steps_per_second": 3.859,
"step": 14000
},
{
"epoch": 112.8,
"grad_norm": 0.38912442326545715,
"learning_rate": 2.4750000000000002e-05,
"loss": 0.0531,
"step": 14100
},
{
"epoch": 113.0,
"eval_accuracy_no_text": 0.9806236837870479,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9806236837870479,
"eval_iou_text": 0.0,
"eval_loss": 0.10462525486946106,
"eval_mean_accuracy": 0.9806236837870479,
"eval_mean_iou": 0.49031184189352395,
"eval_overall_accuracy": 0.9806236837870479,
"eval_runtime": 8.2827,
"eval_samples_per_second": 30.666,
"eval_steps_per_second": 3.863,
"step": 14125
},
{
"epoch": 113.6,
"grad_norm": 0.5761541128158569,
"learning_rate": 2.45e-05,
"loss": 0.0478,
"step": 14200
},
{
"epoch": 114.0,
"eval_accuracy_no_text": 0.9830612214888201,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9830612214888201,
"eval_iou_text": 0.0,
"eval_loss": 0.10361193120479584,
"eval_mean_accuracy": 0.9830612214888201,
"eval_mean_iou": 0.49153061074441007,
"eval_overall_accuracy": 0.9830612214888201,
"eval_runtime": 8.3565,
"eval_samples_per_second": 30.396,
"eval_steps_per_second": 3.829,
"step": 14250
},
{
"epoch": 114.4,
"grad_norm": 0.43338820338249207,
"learning_rate": 2.425e-05,
"loss": 0.0511,
"step": 14300
},
{
"epoch": 115.0,
"eval_accuracy_no_text": 0.9807316019297658,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9807316019297658,
"eval_iou_text": 0.0,
"eval_loss": 0.10400665551424026,
"eval_mean_accuracy": 0.9807316019297658,
"eval_mean_iou": 0.4903658009648829,
"eval_overall_accuracy": 0.9807316019297658,
"eval_runtime": 8.1898,
"eval_samples_per_second": 31.014,
"eval_steps_per_second": 3.907,
"step": 14375
},
{
"epoch": 115.2,
"grad_norm": 0.4137003421783447,
"learning_rate": 2.4000000000000004e-05,
"loss": 0.0516,
"step": 14400
},
{
"epoch": 116.0,
"grad_norm": 0.34559884667396545,
"learning_rate": 2.375e-05,
"loss": 0.05,
"step": 14500
},
{
"epoch": 116.0,
"eval_accuracy_no_text": 0.9825900370867884,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9825900370867884,
"eval_iou_text": 0.0,
"eval_loss": 0.10383593291044235,
"eval_mean_accuracy": 0.9825900370867884,
"eval_mean_iou": 0.4912950185433942,
"eval_overall_accuracy": 0.9825900370867884,
"eval_runtime": 8.3311,
"eval_samples_per_second": 30.488,
"eval_steps_per_second": 3.841,
"step": 14500
},
{
"epoch": 116.8,
"grad_norm": 0.5693605542182922,
"learning_rate": 2.3500000000000002e-05,
"loss": 0.0522,
"step": 14600
},
{
"epoch": 117.0,
"eval_accuracy_no_text": 0.9813530907997,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9813530907997,
"eval_iou_text": 0.0,
"eval_loss": 0.10510838031768799,
"eval_mean_accuracy": 0.9813530907997,
"eval_mean_iou": 0.49067654539985,
"eval_overall_accuracy": 0.9813530907997,
"eval_runtime": 8.3739,
"eval_samples_per_second": 30.332,
"eval_steps_per_second": 3.821,
"step": 14625
},
{
"epoch": 117.6,
"grad_norm": 3.1022820472717285,
"learning_rate": 2.3250000000000003e-05,
"loss": 0.0492,
"step": 14700
},
{
"epoch": 118.0,
"eval_accuracy_no_text": 0.9816835745346747,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9816835745346747,
"eval_iou_text": 0.0,
"eval_loss": 0.10122588276863098,
"eval_mean_accuracy": 0.9816835745346747,
"eval_mean_iou": 0.49084178726733735,
"eval_overall_accuracy": 0.9816835745346747,
"eval_runtime": 8.251,
"eval_samples_per_second": 30.784,
"eval_steps_per_second": 3.878,
"step": 14750
},
{
"epoch": 118.4,
"grad_norm": 6.673212051391602,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0526,
"step": 14800
},
{
"epoch": 119.0,
"eval_accuracy_no_text": 0.9810688315871336,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9810688315871336,
"eval_iou_text": 0.0,
"eval_loss": 0.10411898046731949,
"eval_mean_accuracy": 0.9810688315871336,
"eval_mean_iou": 0.4905344157935668,
"eval_overall_accuracy": 0.9810688315871336,
"eval_runtime": 8.5831,
"eval_samples_per_second": 29.593,
"eval_steps_per_second": 3.728,
"step": 14875
},
{
"epoch": 119.2,
"grad_norm": 1.0424220561981201,
"learning_rate": 2.275e-05,
"loss": 0.0483,
"step": 14900
},
{
"epoch": 120.0,
"grad_norm": 0.8458845019340515,
"learning_rate": 2.25e-05,
"loss": 0.0483,
"step": 15000
},
{
"epoch": 120.0,
"eval_accuracy_no_text": 0.9836277958919825,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9836277958919825,
"eval_iou_text": 0.0,
"eval_loss": 0.10483555495738983,
"eval_mean_accuracy": 0.9836277958919825,
"eval_mean_iou": 0.49181389794599123,
"eval_overall_accuracy": 0.9836277958919825,
"eval_runtime": 8.2865,
"eval_samples_per_second": 30.652,
"eval_steps_per_second": 3.862,
"step": 15000
},
{
"epoch": 120.8,
"grad_norm": 0.9494897127151489,
"learning_rate": 2.2250000000000002e-05,
"loss": 0.0496,
"step": 15100
},
{
"epoch": 121.0,
"eval_accuracy_no_text": 0.9807214830461761,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9807214830461761,
"eval_iou_text": 0.0,
"eval_loss": 0.10666216909885406,
"eval_mean_accuracy": 0.9807214830461761,
"eval_mean_iou": 0.49036074152308806,
"eval_overall_accuracy": 0.9807214830461761,
"eval_runtime": 8.3274,
"eval_samples_per_second": 30.502,
"eval_steps_per_second": 3.843,
"step": 15125
},
{
"epoch": 121.6,
"grad_norm": 0.33741095662117004,
"learning_rate": 2.2e-05,
"loss": 0.0486,
"step": 15200
},
{
"epoch": 122.0,
"eval_accuracy_no_text": 0.9799435585621249,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9799435585621249,
"eval_iou_text": 0.0,
"eval_loss": 0.10895564407110214,
"eval_mean_accuracy": 0.9799435585621249,
"eval_mean_iou": 0.48997177928106245,
"eval_overall_accuracy": 0.9799435585621249,
"eval_runtime": 8.4498,
"eval_samples_per_second": 30.06,
"eval_steps_per_second": 3.787,
"step": 15250
},
{
"epoch": 122.4,
"grad_norm": 0.38935738801956177,
"learning_rate": 2.175e-05,
"loss": 0.0539,
"step": 15300
},
{
"epoch": 123.0,
"eval_accuracy_no_text": 0.9796546303737149,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9796546303737149,
"eval_iou_text": 0.0,
"eval_loss": 0.10292521864175797,
"eval_mean_accuracy": 0.9796546303737149,
"eval_mean_iou": 0.48982731518685746,
"eval_overall_accuracy": 0.9796546303737149,
"eval_runtime": 8.2096,
"eval_samples_per_second": 30.939,
"eval_steps_per_second": 3.898,
"step": 15375
},
{
"epoch": 123.2,
"grad_norm": 0.4297466278076172,
"learning_rate": 2.15e-05,
"loss": 0.0498,
"step": 15400
},
{
"epoch": 124.0,
"grad_norm": 0.7218087911605835,
"learning_rate": 2.1249999999999998e-05,
"loss": 0.0507,
"step": 15500
},
{
"epoch": 124.0,
"eval_accuracy_no_text": 0.9803565552296226,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9803565552296226,
"eval_iou_text": 0.0,
"eval_loss": 0.10427888482809067,
"eval_mean_accuracy": 0.9803565552296226,
"eval_mean_iou": 0.4901782776148113,
"eval_overall_accuracy": 0.9803565552296226,
"eval_runtime": 8.4272,
"eval_samples_per_second": 30.14,
"eval_steps_per_second": 3.797,
"step": 15500
},
{
"epoch": 124.8,
"grad_norm": 0.3873758316040039,
"learning_rate": 2.1e-05,
"loss": 0.0482,
"step": 15600
},
{
"epoch": 125.0,
"eval_accuracy_no_text": 0.9791164519837788,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9791164519837788,
"eval_iou_text": 0.0,
"eval_loss": 0.1063632071018219,
"eval_mean_accuracy": 0.9791164519837788,
"eval_mean_iou": 0.4895582259918894,
"eval_overall_accuracy": 0.9791164519837788,
"eval_runtime": 8.3041,
"eval_samples_per_second": 30.587,
"eval_steps_per_second": 3.854,
"step": 15625
},
{
"epoch": 125.6,
"grad_norm": 0.4336509704589844,
"learning_rate": 2.075e-05,
"loss": 0.0487,
"step": 15700
},
{
"epoch": 126.0,
"eval_accuracy_no_text": 0.981322318759621,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.981322318759621,
"eval_iou_text": 0.0,
"eval_loss": 0.10696995258331299,
"eval_mean_accuracy": 0.981322318759621,
"eval_mean_iou": 0.4906611593798105,
"eval_overall_accuracy": 0.981322318759621,
"eval_runtime": 8.3258,
"eval_samples_per_second": 30.508,
"eval_steps_per_second": 3.843,
"step": 15750
},
{
"epoch": 126.4,
"grad_norm": 0.6076303124427795,
"learning_rate": 2.0499999999999997e-05,
"loss": 0.0492,
"step": 15800
},
{
"epoch": 127.0,
"eval_accuracy_no_text": 0.9836348408946788,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9836348408946788,
"eval_iou_text": 0.0,
"eval_loss": 0.11010294407606125,
"eval_mean_accuracy": 0.9836348408946788,
"eval_mean_iou": 0.4918174204473394,
"eval_overall_accuracy": 0.9836348408946788,
"eval_runtime": 8.4835,
"eval_samples_per_second": 29.941,
"eval_steps_per_second": 3.772,
"step": 15875
},
{
"epoch": 127.2,
"grad_norm": 0.2879132032394409,
"learning_rate": 2.0249999999999998e-05,
"loss": 0.0507,
"step": 15900
},
{
"epoch": 128.0,
"grad_norm": 0.3296537697315216,
"learning_rate": 1.9999999999999998e-05,
"loss": 0.0479,
"step": 16000
},
{
"epoch": 128.0,
"eval_accuracy_no_text": 0.9799868587437913,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9799868587437913,
"eval_iou_text": 0.0,
"eval_loss": 0.10447646677494049,
"eval_mean_accuracy": 0.9799868587437913,
"eval_mean_iou": 0.48999342937189566,
"eval_overall_accuracy": 0.9799868587437913,
"eval_runtime": 8.3118,
"eval_samples_per_second": 30.559,
"eval_steps_per_second": 3.85,
"step": 16000
},
{
"epoch": 128.8,
"grad_norm": 0.43510717153549194,
"learning_rate": 1.9749999999999996e-05,
"loss": 0.0514,
"step": 16100
},
{
"epoch": 129.0,
"eval_accuracy_no_text": 0.9819989048676233,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9819989048676233,
"eval_iou_text": 0.0,
"eval_loss": 0.10433124750852585,
"eval_mean_accuracy": 0.9819989048676233,
"eval_mean_iou": 0.49099945243381166,
"eval_overall_accuracy": 0.9819989048676233,
"eval_runtime": 8.1845,
"eval_samples_per_second": 31.034,
"eval_steps_per_second": 3.91,
"step": 16125
},
{
"epoch": 129.6,
"grad_norm": 0.9808353781700134,
"learning_rate": 1.9499999999999996e-05,
"loss": 0.0505,
"step": 16200
},
{
"epoch": 130.0,
"eval_accuracy_no_text": 0.9821372295078277,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9821372295078277,
"eval_iou_text": 0.0,
"eval_loss": 0.1069905087351799,
"eval_mean_accuracy": 0.9821372295078277,
"eval_mean_iou": 0.49106861475391383,
"eval_overall_accuracy": 0.9821372295078277,
"eval_runtime": 8.336,
"eval_samples_per_second": 30.47,
"eval_steps_per_second": 3.839,
"step": 16250
},
{
"epoch": 130.4,
"grad_norm": 0.44676822423934937,
"learning_rate": 1.9250000000000004e-05,
"loss": 0.0491,
"step": 16300
},
{
"epoch": 131.0,
"eval_accuracy_no_text": 0.9810748464243413,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9810748464243413,
"eval_iou_text": 0.0,
"eval_loss": 0.10192025452852249,
"eval_mean_accuracy": 0.9810748464243413,
"eval_mean_iou": 0.49053742321217064,
"eval_overall_accuracy": 0.9810748464243413,
"eval_runtime": 8.1762,
"eval_samples_per_second": 31.066,
"eval_steps_per_second": 3.914,
"step": 16375
},
{
"epoch": 131.2,
"grad_norm": 0.2674311101436615,
"learning_rate": 1.9000000000000008e-05,
"loss": 0.0479,
"step": 16400
},
{
"epoch": 132.0,
"grad_norm": 0.18870976567268372,
"learning_rate": 1.8750000000000002e-05,
"loss": 0.0477,
"step": 16500
},
{
"epoch": 132.0,
"eval_accuracy_no_text": 0.9808076347890541,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9808076347890541,
"eval_iou_text": 0.0,
"eval_loss": 0.10085348039865494,
"eval_mean_accuracy": 0.9808076347890541,
"eval_mean_iou": 0.49040381739452704,
"eval_overall_accuracy": 0.9808076347890541,
"eval_runtime": 8.2705,
"eval_samples_per_second": 30.712,
"eval_steps_per_second": 3.869,
"step": 16500
},
{
"epoch": 132.8,
"grad_norm": 1.6924952268600464,
"learning_rate": 1.8500000000000006e-05,
"loss": 0.0476,
"step": 16600
},
{
"epoch": 133.0,
"eval_accuracy_no_text": 0.9818020435658646,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9818020435658646,
"eval_iou_text": 0.0,
"eval_loss": 0.10147301107645035,
"eval_mean_accuracy": 0.9818020435658646,
"eval_mean_iou": 0.4909010217829323,
"eval_overall_accuracy": 0.9818020435658646,
"eval_runtime": 8.2767,
"eval_samples_per_second": 30.688,
"eval_steps_per_second": 3.866,
"step": 16625
},
{
"epoch": 133.6,
"grad_norm": 0.26980453729629517,
"learning_rate": 1.8250000000000003e-05,
"loss": 0.0462,
"step": 16700
},
{
"epoch": 134.0,
"eval_accuracy_no_text": 0.9804314416144155,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9804314416144155,
"eval_iou_text": 0.0,
"eval_loss": 0.10597039759159088,
"eval_mean_accuracy": 0.9804314416144155,
"eval_mean_iou": 0.49021572080720777,
"eval_overall_accuracy": 0.9804314416144155,
"eval_runtime": 8.2302,
"eval_samples_per_second": 30.862,
"eval_steps_per_second": 3.888,
"step": 16750
},
{
"epoch": 134.4,
"grad_norm": 0.5653632283210754,
"learning_rate": 1.8000000000000004e-05,
"loss": 0.0485,
"step": 16800
},
{
"epoch": 135.0,
"eval_accuracy_no_text": 0.9795444691287234,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9795444691287234,
"eval_iou_text": 0.0,
"eval_loss": 0.10182661563158035,
"eval_mean_accuracy": 0.9795444691287234,
"eval_mean_iou": 0.4897722345643617,
"eval_overall_accuracy": 0.9795444691287234,
"eval_runtime": 8.1917,
"eval_samples_per_second": 31.007,
"eval_steps_per_second": 3.906,
"step": 16875
},
{
"epoch": 135.2,
"grad_norm": 0.603354275226593,
"learning_rate": 1.775e-05,
"loss": 0.0518,
"step": 16900
},
{
"epoch": 136.0,
"grad_norm": 0.7962479591369629,
"learning_rate": 1.7500000000000002e-05,
"loss": 0.0483,
"step": 17000
},
{
"epoch": 136.0,
"eval_accuracy_no_text": 0.9795505836593654,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9795505836593654,
"eval_iou_text": 0.0,
"eval_loss": 0.10557083040475845,
"eval_mean_accuracy": 0.9795505836593654,
"eval_mean_iou": 0.4897752918296827,
"eval_overall_accuracy": 0.9795505836593654,
"eval_runtime": 8.2516,
"eval_samples_per_second": 30.782,
"eval_steps_per_second": 3.878,
"step": 17000
},
{
"epoch": 136.8,
"grad_norm": 0.2562846839427948,
"learning_rate": 1.725e-05,
"loss": 0.0503,
"step": 17100
},
{
"epoch": 137.0,
"eval_accuracy_no_text": 0.9820201229535742,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9820201229535742,
"eval_iou_text": 0.0,
"eval_loss": 0.10440485179424286,
"eval_mean_accuracy": 0.9820201229535742,
"eval_mean_iou": 0.4910100614767871,
"eval_overall_accuracy": 0.9820201229535742,
"eval_runtime": 8.1927,
"eval_samples_per_second": 31.003,
"eval_steps_per_second": 3.906,
"step": 17125
},
{
"epoch": 137.6,
"grad_norm": 0.45571181178092957,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0514,
"step": 17200
},
{
"epoch": 138.0,
"eval_accuracy_no_text": 0.9812987744935345,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9812987744935345,
"eval_iou_text": 0.0,
"eval_loss": 0.10530504584312439,
"eval_mean_accuracy": 0.9812987744935345,
"eval_mean_iou": 0.49064938724676727,
"eval_overall_accuracy": 0.9812987744935345,
"eval_runtime": 8.2797,
"eval_samples_per_second": 30.678,
"eval_steps_per_second": 3.865,
"step": 17250
},
{
"epoch": 138.4,
"grad_norm": 0.21188737452030182,
"learning_rate": 1.675e-05,
"loss": 0.0446,
"step": 17300
},
{
"epoch": 139.0,
"eval_accuracy_no_text": 0.9807978980636295,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9807978980636295,
"eval_iou_text": 0.0,
"eval_loss": 0.10513133555650711,
"eval_mean_accuracy": 0.9807978980636295,
"eval_mean_iou": 0.49039894903181475,
"eval_overall_accuracy": 0.9807978980636295,
"eval_runtime": 8.251,
"eval_samples_per_second": 30.784,
"eval_steps_per_second": 3.878,
"step": 17375
},
{
"epoch": 139.2,
"grad_norm": 0.8840853571891785,
"learning_rate": 1.65e-05,
"loss": 0.0504,
"step": 17400
},
{
"epoch": 140.0,
"grad_norm": 0.943657398223877,
"learning_rate": 1.625e-05,
"loss": 0.047,
"step": 17500
},
{
"epoch": 140.0,
"eval_accuracy_no_text": 0.9806808579716656,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9806808579716656,
"eval_iou_text": 0.0,
"eval_loss": 0.1071048378944397,
"eval_mean_accuracy": 0.9806808579716656,
"eval_mean_iou": 0.4903404289858328,
"eval_overall_accuracy": 0.9806808579716656,
"eval_runtime": 8.5372,
"eval_samples_per_second": 29.752,
"eval_steps_per_second": 3.748,
"step": 17500
},
{
"epoch": 140.8,
"grad_norm": 0.7239159941673279,
"learning_rate": 1.6e-05,
"loss": 0.0467,
"step": 17600
},
{
"epoch": 141.0,
"eval_accuracy_no_text": 0.9828105755792126,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9828105755792126,
"eval_iou_text": 0.0,
"eval_loss": 0.10849156975746155,
"eval_mean_accuracy": 0.9828105755792126,
"eval_mean_iou": 0.4914052877896063,
"eval_overall_accuracy": 0.9828105755792126,
"eval_runtime": 8.3714,
"eval_samples_per_second": 30.341,
"eval_steps_per_second": 3.823,
"step": 17625
},
{
"epoch": 141.6,
"grad_norm": 0.34657156467437744,
"learning_rate": 1.5749999999999997e-05,
"loss": 0.0476,
"step": 17700
},
{
"epoch": 142.0,
"eval_accuracy_no_text": 0.9832416998361954,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9832416998361954,
"eval_iou_text": 0.0,
"eval_loss": 0.1076694130897522,
"eval_mean_accuracy": 0.9832416998361954,
"eval_mean_iou": 0.4916208499180977,
"eval_overall_accuracy": 0.9832416998361954,
"eval_runtime": 8.3324,
"eval_samples_per_second": 30.483,
"eval_steps_per_second": 3.84,
"step": 17750
},
{
"epoch": 142.4,
"grad_norm": 1.23021399974823,
"learning_rate": 1.55e-05,
"loss": 0.0472,
"step": 17800
},
{
"epoch": 143.0,
"eval_accuracy_no_text": 0.9818141397025696,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9818141397025696,
"eval_iou_text": 0.0,
"eval_loss": 0.11224336177110672,
"eval_mean_accuracy": 0.9818141397025696,
"eval_mean_iou": 0.4909070698512848,
"eval_overall_accuracy": 0.9818141397025696,
"eval_runtime": 8.346,
"eval_samples_per_second": 30.434,
"eval_steps_per_second": 3.834,
"step": 17875
},
{
"epoch": 143.2,
"grad_norm": 0.43515679240226746,
"learning_rate": 1.525e-05,
"loss": 0.0474,
"step": 17900
},
{
"epoch": 144.0,
"grad_norm": 0.26305532455444336,
"learning_rate": 1.5e-05,
"loss": 0.0477,
"step": 18000
},
{
"epoch": 144.0,
"eval_accuracy_no_text": 0.9808217912567363,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9808217912567363,
"eval_iou_text": 0.0,
"eval_loss": 0.10432812571525574,
"eval_mean_accuracy": 0.9808217912567363,
"eval_mean_iou": 0.49041089562836815,
"eval_overall_accuracy": 0.9808217912567363,
"eval_runtime": 8.2922,
"eval_samples_per_second": 30.631,
"eval_steps_per_second": 3.859,
"step": 18000
},
{
"epoch": 144.8,
"grad_norm": 0.24621394276618958,
"learning_rate": 1.4749999999999998e-05,
"loss": 0.0467,
"step": 18100
},
{
"epoch": 145.0,
"eval_accuracy_no_text": 0.9796973988570646,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9796973988570646,
"eval_iou_text": 0.0,
"eval_loss": 0.10507868975400925,
"eval_mean_accuracy": 0.9796973988570646,
"eval_mean_iou": 0.4898486994285323,
"eval_overall_accuracy": 0.9796973988570646,
"eval_runtime": 8.3989,
"eval_samples_per_second": 30.242,
"eval_steps_per_second": 3.81,
"step": 18125
},
{
"epoch": 145.6,
"grad_norm": 0.8053872585296631,
"learning_rate": 1.45e-05,
"loss": 0.0493,
"step": 18200
},
{
"epoch": 146.0,
"eval_accuracy_no_text": 0.9794659273180032,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9794659273180032,
"eval_iou_text": 0.0,
"eval_loss": 0.1048658937215805,
"eval_mean_accuracy": 0.9794659273180032,
"eval_mean_iou": 0.4897329636590016,
"eval_overall_accuracy": 0.9794659273180032,
"eval_runtime": 8.2794,
"eval_samples_per_second": 30.678,
"eval_steps_per_second": 3.865,
"step": 18250
},
{
"epoch": 146.4,
"grad_norm": 0.3059195876121521,
"learning_rate": 1.4249999999999999e-05,
"loss": 0.0485,
"step": 18300
},
{
"epoch": 147.0,
"eval_accuracy_no_text": 0.9809577398700878,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9809577398700878,
"eval_iou_text": 0.0,
"eval_loss": 0.10593844205141068,
"eval_mean_accuracy": 0.9809577398700878,
"eval_mean_iou": 0.4904788699350439,
"eval_overall_accuracy": 0.9809577398700878,
"eval_runtime": 8.3317,
"eval_samples_per_second": 30.486,
"eval_steps_per_second": 3.841,
"step": 18375
},
{
"epoch": 147.2,
"grad_norm": 0.41579416394233704,
"learning_rate": 1.3999999999999998e-05,
"loss": 0.0469,
"step": 18400
},
{
"epoch": 148.0,
"grad_norm": 0.320431113243103,
"learning_rate": 1.375e-05,
"loss": 0.0462,
"step": 18500
},
{
"epoch": 148.0,
"eval_accuracy_no_text": 0.9786900963960741,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9786900963960741,
"eval_iou_text": 0.0,
"eval_loss": 0.10566265136003494,
"eval_mean_accuracy": 0.9786900963960741,
"eval_mean_iou": 0.48934504819803704,
"eval_overall_accuracy": 0.9786900963960741,
"eval_runtime": 8.2787,
"eval_samples_per_second": 30.681,
"eval_steps_per_second": 3.865,
"step": 18500
},
{
"epoch": 148.8,
"grad_norm": 0.44983476400375366,
"learning_rate": 1.35e-05,
"loss": 0.0474,
"step": 18600
},
{
"epoch": 149.0,
"eval_accuracy_no_text": 0.9800260382635032,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9800260382635032,
"eval_iou_text": 0.0,
"eval_loss": 0.10372522473335266,
"eval_mean_accuracy": 0.9800260382635032,
"eval_mean_iou": 0.4900130191317516,
"eval_overall_accuracy": 0.9800260382635032,
"eval_runtime": 8.1632,
"eval_samples_per_second": 31.115,
"eval_steps_per_second": 3.92,
"step": 18625
},
{
"epoch": 149.6,
"grad_norm": 0.1674959510564804,
"learning_rate": 1.3249999999999999e-05,
"loss": 0.0506,
"step": 18700
},
{
"epoch": 150.0,
"eval_accuracy_no_text": 0.9814382456082342,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9814382456082342,
"eval_iou_text": 0.0,
"eval_loss": 0.10518930852413177,
"eval_mean_accuracy": 0.9814382456082342,
"eval_mean_iou": 0.4907191228041171,
"eval_overall_accuracy": 0.9814382456082342,
"eval_runtime": 8.3279,
"eval_samples_per_second": 30.5,
"eval_steps_per_second": 3.843,
"step": 18750
},
{
"epoch": 150.4,
"grad_norm": 0.31716248393058777,
"learning_rate": 1.3000000000000004e-05,
"loss": 0.0479,
"step": 18800
},
{
"epoch": 151.0,
"eval_accuracy_no_text": 0.9805025396487019,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9805025396487019,
"eval_iou_text": 0.0,
"eval_loss": 0.10686381161212921,
"eval_mean_accuracy": 0.9805025396487019,
"eval_mean_iou": 0.49025126982435097,
"eval_overall_accuracy": 0.9805025396487019,
"eval_runtime": 8.3922,
"eval_samples_per_second": 30.266,
"eval_steps_per_second": 3.813,
"step": 18875
},
{
"epoch": 151.2,
"grad_norm": 0.9992444515228271,
"learning_rate": 1.2750000000000003e-05,
"loss": 0.0464,
"step": 18900
},
{
"epoch": 152.0,
"grad_norm": 0.19730743765830994,
"learning_rate": 1.2500000000000002e-05,
"loss": 0.0439,
"step": 19000
},
{
"epoch": 152.0,
"eval_accuracy_no_text": 0.98159488060922,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.98159488060922,
"eval_iou_text": 0.0,
"eval_loss": 0.1079552099108696,
"eval_mean_accuracy": 0.98159488060922,
"eval_mean_iou": 0.49079744030461,
"eval_overall_accuracy": 0.98159488060922,
"eval_runtime": 8.3262,
"eval_samples_per_second": 30.506,
"eval_steps_per_second": 3.843,
"step": 19000
},
{
"epoch": 152.8,
"grad_norm": 0.3917344808578491,
"learning_rate": 1.2250000000000003e-05,
"loss": 0.0492,
"step": 19100
},
{
"epoch": 153.0,
"eval_accuracy_no_text": 0.9807935613992339,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9807935613992339,
"eval_iou_text": 0.0,
"eval_loss": 0.10192196071147919,
"eval_mean_accuracy": 0.9807935613992339,
"eval_mean_iou": 0.49039678069961695,
"eval_overall_accuracy": 0.9807935613992339,
"eval_runtime": 8.236,
"eval_samples_per_second": 30.84,
"eval_steps_per_second": 3.885,
"step": 19125
},
{
"epoch": 153.6,
"grad_norm": 0.3044929504394531,
"learning_rate": 1.2000000000000002e-05,
"loss": 0.0442,
"step": 19200
},
{
"epoch": 154.0,
"eval_accuracy_no_text": 0.9820950259539395,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9820950259539395,
"eval_iou_text": 0.0,
"eval_loss": 0.1053338274359703,
"eval_mean_accuracy": 0.9820950259539395,
"eval_mean_iou": 0.49104751297696975,
"eval_overall_accuracy": 0.9820950259539395,
"eval_runtime": 8.244,
"eval_samples_per_second": 30.81,
"eval_steps_per_second": 3.882,
"step": 19250
},
{
"epoch": 154.4,
"grad_norm": 0.5873416662216187,
"learning_rate": 1.1750000000000003e-05,
"loss": 0.0484,
"step": 19300
},
{
"epoch": 155.0,
"eval_accuracy_no_text": 0.9818892088586589,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9818892088586589,
"eval_iou_text": 0.0,
"eval_loss": 0.10322853177785873,
"eval_mean_accuracy": 0.9818892088586589,
"eval_mean_iou": 0.49094460442932947,
"eval_overall_accuracy": 0.9818892088586589,
"eval_runtime": 8.2069,
"eval_samples_per_second": 30.95,
"eval_steps_per_second": 3.899,
"step": 19375
},
{
"epoch": 155.2,
"grad_norm": 1.538596272468567,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0456,
"step": 19400
},
{
"epoch": 156.0,
"grad_norm": 1.1352208852767944,
"learning_rate": 1.1250000000000002e-05,
"loss": 0.0466,
"step": 19500
},
{
"epoch": 156.0,
"eval_accuracy_no_text": 0.9812151483176609,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9812151483176609,
"eval_iou_text": 0.0,
"eval_loss": 0.10393723100423813,
"eval_mean_accuracy": 0.9812151483176609,
"eval_mean_iou": 0.49060757415883044,
"eval_overall_accuracy": 0.9812151483176609,
"eval_runtime": 8.309,
"eval_samples_per_second": 30.569,
"eval_steps_per_second": 3.851,
"step": 19500
},
{
"epoch": 156.8,
"grad_norm": 0.30518653988838196,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0444,
"step": 19600
},
{
"epoch": 157.0,
"eval_accuracy_no_text": 0.9808679825479997,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9808679825479997,
"eval_iou_text": 0.0,
"eval_loss": 0.103802390396595,
"eval_mean_accuracy": 0.9808679825479997,
"eval_mean_iou": 0.49043399127399984,
"eval_overall_accuracy": 0.9808679825479997,
"eval_runtime": 8.2717,
"eval_samples_per_second": 30.707,
"eval_steps_per_second": 3.869,
"step": 19625
},
{
"epoch": 157.6,
"grad_norm": 0.371191143989563,
"learning_rate": 1.075e-05,
"loss": 0.0463,
"step": 19700
},
{
"epoch": 158.0,
"eval_accuracy_no_text": 0.9814478494090796,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9814478494090796,
"eval_iou_text": 0.0,
"eval_loss": 0.10381000488996506,
"eval_mean_accuracy": 0.9814478494090796,
"eval_mean_iou": 0.4907239247045398,
"eval_overall_accuracy": 0.9814478494090796,
"eval_runtime": 8.5122,
"eval_samples_per_second": 29.839,
"eval_steps_per_second": 3.759,
"step": 19750
},
{
"epoch": 158.4,
"grad_norm": 0.6957194209098816,
"learning_rate": 1.0500000000000001e-05,
"loss": 0.0465,
"step": 19800
},
{
"epoch": 159.0,
"eval_accuracy_no_text": 0.9814518703775997,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9814518703775997,
"eval_iou_text": 0.0,
"eval_loss": 0.10540702193975449,
"eval_mean_accuracy": 0.9814518703775997,
"eval_mean_iou": 0.49072593518879987,
"eval_overall_accuracy": 0.9814518703775997,
"eval_runtime": 8.1775,
"eval_samples_per_second": 31.061,
"eval_steps_per_second": 3.913,
"step": 19875
},
{
"epoch": 159.2,
"grad_norm": 0.21183647215366364,
"learning_rate": 1.025e-05,
"loss": 0.0464,
"step": 19900
},
{
"epoch": 160.0,
"grad_norm": 0.3967491090297699,
"learning_rate": 9.999999999999999e-06,
"loss": 0.046,
"step": 20000
},
{
"epoch": 160.0,
"eval_accuracy_no_text": 0.9804176340737537,
"eval_accuracy_text": NaN,
"eval_iou_no_text": 0.9804176340737537,
"eval_iou_text": 0.0,
"eval_loss": 0.10416771471500397,
"eval_mean_accuracy": 0.9804176340737537,
"eval_mean_iou": 0.49020881703687685,
"eval_overall_accuracy": 0.9804176340737537,
"eval_runtime": 8.2603,
"eval_samples_per_second": 30.75,
"eval_steps_per_second": 3.874,
"step": 20000
},
{
"epoch": 160.0,
"step": 20000,
"total_flos": 2.80447288344576e+18,
"train_loss": 0.01519945946931839,
"train_runtime": 1952.9271,
"train_samples_per_second": 81.928,
"train_steps_per_second": 10.241
}
],
"logging_steps": 100,
"max_steps": 20000,
"num_input_tokens_seen": 0,
"num_train_epochs": 160,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 2.80447288344576e+18,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}