{ "best_metric": 3.0374205112457275, "best_model_checkpoint": "../Modelos/bloomz_AEx_SQAC_SQuAD/checkpoint-1000", "epoch": 0.898069151324652, "global_step": 1000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.04, "eval_loss": 5.792993068695068, "eval_runtime": 79.9398, "eval_samples_per_second": 103.741, "eval_steps_per_second": 25.945, "step": 50 }, { "epoch": 0.09, "eval_loss": 4.746491432189941, "eval_runtime": 79.9383, "eval_samples_per_second": 103.743, "eval_steps_per_second": 25.945, "step": 100 }, { "epoch": 0.13, "eval_loss": 4.1346588134765625, "eval_runtime": 79.9476, "eval_samples_per_second": 103.73, "eval_steps_per_second": 25.942, "step": 150 }, { "epoch": 0.18, "eval_loss": 3.8906848430633545, "eval_runtime": 79.9385, "eval_samples_per_second": 103.742, "eval_steps_per_second": 25.945, "step": 200 }, { "epoch": 0.22, "eval_loss": 3.7085936069488525, "eval_runtime": 79.9395, "eval_samples_per_second": 103.741, "eval_steps_per_second": 25.945, "step": 250 }, { "epoch": 0.27, "eval_loss": 3.563627004623413, "eval_runtime": 79.9406, "eval_samples_per_second": 103.74, "eval_steps_per_second": 25.944, "step": 300 }, { "epoch": 0.31, "eval_loss": 3.4549553394317627, "eval_runtime": 79.9322, "eval_samples_per_second": 103.75, "eval_steps_per_second": 25.947, "step": 350 }, { "epoch": 0.36, "eval_loss": 3.3643569946289062, "eval_runtime": 79.932, "eval_samples_per_second": 103.751, "eval_steps_per_second": 25.947, "step": 400 }, { "epoch": 0.4, "eval_loss": 3.3192312717437744, "eval_runtime": 79.9445, "eval_samples_per_second": 103.734, "eval_steps_per_second": 25.943, "step": 450 }, { "epoch": 0.45, "learning_rate": 4.2572626534890685e-05, "loss": 4.1989, "step": 500 }, { "epoch": 0.45, "eval_loss": 3.2668206691741943, "eval_runtime": 79.9572, "eval_samples_per_second": 103.718, "eval_steps_per_second": 25.939, "step": 500 }, { "epoch": 0.49, "eval_loss": 3.2073845863342285, "eval_runtime": 79.9534, "eval_samples_per_second": 103.723, "eval_steps_per_second": 25.94, "step": 550 }, { "epoch": 0.54, "eval_loss": 3.1692163944244385, "eval_runtime": 79.94, "eval_samples_per_second": 103.74, "eval_steps_per_second": 25.944, "step": 600 }, { "epoch": 0.58, "eval_loss": 3.1374781131744385, "eval_runtime": 79.9406, "eval_samples_per_second": 103.74, "eval_steps_per_second": 25.944, "step": 650 }, { "epoch": 0.63, "eval_loss": 3.1055877208709717, "eval_runtime": 79.926, "eval_samples_per_second": 103.758, "eval_steps_per_second": 25.949, "step": 700 }, { "epoch": 0.67, "eval_loss": 3.0914928913116455, "eval_runtime": 79.9363, "eval_samples_per_second": 103.745, "eval_steps_per_second": 25.946, "step": 750 }, { "epoch": 0.72, "eval_loss": 3.0823092460632324, "eval_runtime": 79.9387, "eval_samples_per_second": 103.742, "eval_steps_per_second": 25.945, "step": 800 }, { "epoch": 0.76, "eval_loss": 3.05977463722229, "eval_runtime": 79.9397, "eval_samples_per_second": 103.741, "eval_steps_per_second": 25.945, "step": 850 }, { "epoch": 0.81, "eval_loss": 3.0491394996643066, "eval_runtime": 79.9347, "eval_samples_per_second": 103.747, "eval_steps_per_second": 25.946, "step": 900 }, { "epoch": 0.85, "eval_loss": 3.039747953414917, "eval_runtime": 79.9452, "eval_samples_per_second": 103.734, "eval_steps_per_second": 25.943, "step": 950 }, { "epoch": 0.9, "learning_rate": 3.508535489667565e-05, "loss": 2.7285, "step": 1000 }, { "epoch": 0.9, "eval_loss": 3.0374205112457275, "eval_runtime": 79.9218, "eval_samples_per_second": 103.764, "eval_steps_per_second": 25.95, "step": 1000 } ], "max_steps": 3339, "num_train_epochs": 3, "total_flos": 4.618973186359296e+16, "trial_name": null, "trial_params": null }