{ "best_metric": 0.7127555988315482, "best_model_checkpoint": "whisper-reg-ben\\checkpoint-6000", "epoch": 3.634161114476075, "eval_steps": 500, "global_step": 6000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.30284675953967294, "eval_cer": 0.49007230153778397, "eval_loss": 2.5224013328552246, "eval_runtime": 19.2778, "eval_samples_per_second": 6.951, "eval_steps_per_second": 1.764, "eval_wer": 1.0074001947419668, "step": 500 }, { "epoch": 0.6056935190793459, "grad_norm": 6.7337727546691895, "learning_rate": 9.692067457838851e-06, "loss": 2.9581, "step": 1000 }, { "epoch": 0.6056935190793459, "eval_cer": 0.3797115278746284, "eval_loss": 1.7524603605270386, "eval_runtime": 19.6842, "eval_samples_per_second": 6.807, "eval_steps_per_second": 1.727, "eval_wer": 0.84634858812074, "step": 1000 }, { "epoch": 0.9085402786190188, "eval_cer": 0.3615076889198811, "eval_loss": 1.5823218822479248, "eval_runtime": 18.1939, "eval_samples_per_second": 7.365, "eval_steps_per_second": 1.869, "eval_wer": 0.7945472249269717, "step": 1500 }, { "epoch": 1.2113870381586918, "grad_norm": 4.9313130378723145, "learning_rate": 9.067457838850719e-06, "loss": 1.6132, "step": 2000 }, { "epoch": 1.2113870381586918, "eval_cer": 0.3612507799023746, "eval_loss": 1.4997178316116333, "eval_runtime": 21.2924, "eval_samples_per_second": 6.293, "eval_steps_per_second": 1.597, "eval_wer": 0.7700097370983447, "step": 2000 }, { "epoch": 1.5142337976983646, "eval_cer": 0.36807721951040484, "eval_loss": 1.4603444337844849, "eval_runtime": 17.7387, "eval_samples_per_second": 7.554, "eval_steps_per_second": 1.917, "eval_wer": 0.7518987341772152, "step": 2500 }, { "epoch": 1.8170805572380375, "grad_norm": 5.206490516662598, "learning_rate": 8.443472829481576e-06, "loss": 1.5051, "step": 3000 }, { "epoch": 1.8170805572380375, "eval_cer": 0.33611039747495136, "eval_loss": 1.4466902017593384, "eval_runtime": 19.3549, "eval_samples_per_second": 6.923, "eval_steps_per_second": 1.757, "eval_wer": 0.7450827653359299, "step": 3000 }, { "epoch": 2.1199273167777104, "eval_cer": 0.33500935882849486, "eval_loss": 1.4404141902923584, "eval_runtime": 18.1487, "eval_samples_per_second": 7.383, "eval_steps_per_second": 1.873, "eval_wer": 0.7489776046738073, "step": 3500 }, { "epoch": 2.4227740763173835, "grad_norm": 4.5190887451171875, "learning_rate": 7.820737039350407e-06, "loss": 1.3798, "step": 4000 }, { "epoch": 2.4227740763173835, "eval_cer": 0.3345689433699123, "eval_loss": 1.394412636756897, "eval_runtime": 19.6972, "eval_samples_per_second": 6.803, "eval_steps_per_second": 1.726, "eval_wer": 0.7226874391431354, "step": 4000 }, { "epoch": 2.725620835857056, "eval_cer": 0.3381656696150035, "eval_loss": 1.421527624130249, "eval_runtime": 18.6951, "eval_samples_per_second": 7.168, "eval_steps_per_second": 1.819, "eval_wer": 0.7626095423563778, "step": 4500 }, { "epoch": 3.0284675953967293, "grad_norm": 12.196548461914062, "learning_rate": 7.196127420362275e-06, "loss": 1.3506, "step": 5000 }, { "epoch": 3.0284675953967293, "eval_cer": 0.32873343854369286, "eval_loss": 1.3746217489242554, "eval_runtime": 17.0045, "eval_samples_per_second": 7.88, "eval_steps_per_second": 1.999, "eval_wer": 0.7302823758519961, "step": 5000 }, { "epoch": 3.331314354936402, "eval_cer": 0.3210628693067127, "eval_loss": 1.3873779773712158, "eval_runtime": 19.6904, "eval_samples_per_second": 6.805, "eval_steps_per_second": 1.727, "eval_wer": 0.7230769230769231, "step": 5500 }, { "epoch": 3.634161114476075, "grad_norm": 5.505178451538086, "learning_rate": 6.57214241099313e-06, "loss": 1.2704, "step": 6000 }, { "epoch": 3.634161114476075, "eval_cer": 0.31680551987374755, "eval_loss": 1.403659462928772, "eval_runtime": 17.1479, "eval_samples_per_second": 7.814, "eval_steps_per_second": 1.983, "eval_wer": 0.7127555988315482, "step": 6000 } ], "logging_steps": 1000, "max_steps": 16510, "num_input_tokens_seen": 0, "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 2.7849349072039633e+19, "train_batch_size": 4, "trial_name": null, "trial_params": null }