{ "best_global_step": 120, "best_metric": 0.2247939258813858, "best_model_checkpoint": "./llava_adalora_weather_model/checkpoint-120", "epoch": 1.2262210796915167, "eval_steps": 20, "global_step": 120, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.10282776349614396, "grad_norm": 0.5032290816307068, "learning_rate": 6.75e-05, "loss": 2.3108, "mean_token_accuracy": 0.5181779790669679, "num_tokens": 645254.0, "step": 10 }, { "epoch": 0.20565552699228792, "grad_norm": 0.5140016078948975, "learning_rate": 0.0001425, "loss": 1.9876, "mean_token_accuracy": 0.5564090937376023, "num_tokens": 1290816.0, "step": 20 }, { "epoch": 0.20565552699228792, "eval_loss": 1.6786144971847534, "eval_mean_token_accuracy": 0.5918497213950524, "eval_num_tokens": 1290816.0, "eval_runtime": 199.77, "eval_samples_per_second": 0.976, "eval_steps_per_second": 0.976, "step": 20 }, { "epoch": 0.30848329048843187, "grad_norm": 1.200245976448059, "learning_rate": 0.00021749999999999997, "loss": 1.2898, "mean_token_accuracy": 0.6574281774461269, "num_tokens": 1936067.0, "step": 30 }, { "epoch": 0.41131105398457585, "grad_norm": 0.3560621440410614, "learning_rate": 0.00029249999999999995, "loss": 0.5269, "mean_token_accuracy": 0.8504049643874169, "num_tokens": 2581570.0, "step": 40 }, { "epoch": 0.41131105398457585, "eval_loss": 0.3815372884273529, "eval_mean_token_accuracy": 0.8895098340816987, "eval_num_tokens": 2581570.0, "eval_runtime": 199.91, "eval_samples_per_second": 0.975, "eval_steps_per_second": 0.975, "step": 40 }, { "epoch": 0.5141388174807198, "grad_norm": 0.36290714144706726, "learning_rate": 0.0002995163544683256, "loss": 0.3431, "mean_token_accuracy": 0.8966262958943844, "num_tokens": 3226740.0, "step": 50 }, { "epoch": 0.6169665809768637, "grad_norm": 0.3132888674736023, "learning_rate": 0.00029784849709745616, "loss": 0.3131, "mean_token_accuracy": 0.9030718393623829, "num_tokens": 3872000.0, "step": 60 }, { "epoch": 0.6169665809768637, "eval_loss": 0.2877984046936035, "eval_mean_token_accuracy": 0.9094783853261899, "eval_num_tokens": 3872000.0, "eval_runtime": 200.0291, "eval_samples_per_second": 0.975, "eval_steps_per_second": 0.975, "step": 60 }, { "epoch": 0.7197943444730077, "grad_norm": 0.3172520697116852, "learning_rate": 0.0002950037303267096, "loss": 0.2776, "mean_token_accuracy": 0.9121568284928798, "num_tokens": 4517650.0, "step": 70 }, { "epoch": 0.8226221079691517, "grad_norm": 0.2681174576282501, "learning_rate": 0.0002910046991800035, "loss": 0.2463, "mean_token_accuracy": 0.9197294652462006, "num_tokens": 5162524.0, "step": 80 }, { "epoch": 0.8226221079691517, "eval_loss": 0.24699676036834717, "eval_mean_token_accuracy": 0.918833449559334, "eval_num_tokens": 5162524.0, "eval_runtime": 199.9764, "eval_samples_per_second": 0.975, "eval_steps_per_second": 0.975, "step": 80 }, { "epoch": 0.9254498714652957, "grad_norm": 0.25532031059265137, "learning_rate": 0.00028588323690176954, "loss": 0.2409, "mean_token_accuracy": 0.9201722621917725, "num_tokens": 5808159.0, "step": 90 }, { "epoch": 1.0205655526992288, "grad_norm": 0.2883255183696747, "learning_rate": 0.0002796801115567139, "loss": 0.229, "mean_token_accuracy": 0.9240316643908217, "num_tokens": 6405024.0, "step": 100 }, { "epoch": 1.0205655526992288, "eval_loss": 0.2340758889913559, "eval_mean_token_accuracy": 0.9224844058354695, "eval_num_tokens": 6405024.0, "eval_runtime": 199.917, "eval_samples_per_second": 0.975, "eval_steps_per_second": 0.975, "step": 100 }, { "epoch": 1.1233933161953726, "grad_norm": 0.30399489402770996, "learning_rate": 0.0002724447015062708, "loss": 0.2179, "mean_token_accuracy": 0.927613090723753, "num_tokens": 7050233.0, "step": 110 }, { "epoch": 1.2262210796915167, "grad_norm": 0.28451991081237793, "learning_rate": 0.0002642346023450357, "loss": 0.216, "mean_token_accuracy": 0.9265601448714733, "num_tokens": 7695653.0, "step": 120 }, { "epoch": 1.2262210796915167, "eval_loss": 0.2247939258813858, "eval_mean_token_accuracy": 0.925137395125169, "eval_num_tokens": 7695653.0, "eval_runtime": 199.5418, "eval_samples_per_second": 0.977, "eval_steps_per_second": 0.977, "step": 120 } ], "logging_steps": 10, "max_steps": 392, "num_input_tokens_seen": 0, "num_train_epochs": 4, "save_steps": 40, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 3.4604890360353197e+17, "train_batch_size": 1, "trial_name": null, "trial_params": null }