diff --git a/ppo-lora/README.md b/ppo-lora/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/adapter_config.json b/ppo-lora/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/adapter_model.bin b/ppo-lora/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb62cdc9296da31de38e4265553758f3f7390abd --- /dev/null +++ b/ppo-lora/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55c6ec1b08f5cea38e43c3e4eb11b0be787f3cd86a46cf09fe0e6e5048737dea +size 26269517 diff --git a/ppo-lora/checkpoint-1000/README.md b/ppo-lora/checkpoint-1000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/checkpoint-1000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/checkpoint-1000/adapter_config.json b/ppo-lora/checkpoint-1000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-1000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-1000/adapter_model.bin b/ppo-lora/checkpoint-1000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..0255a24a1a05ccafb8858e40c4a5a921c4903d43 --- /dev/null +++ b/ppo-lora/checkpoint-1000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c213d0e4f8d874939ab229e712e25c78ddc973176bd844440186e4b8977c4651 +size 26269517 diff --git a/ppo-lora/checkpoint-1000/finetuning_args.json b/ppo-lora/checkpoint-1000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/checkpoint-1000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/checkpoint-1000/reward/adapter_config.json b/ppo-lora/checkpoint-1000/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-1000/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-1000/reward/adapter_model.bin b/ppo-lora/checkpoint-1000/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/checkpoint-1000/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/checkpoint-1000/training_args.bin b/ppo-lora/checkpoint-1000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/checkpoint-1000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/checkpoint-1000/value_head.bin b/ppo-lora/checkpoint-1000/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7675d58ca63fd5f359c2a890e39070d4b390a90 --- /dev/null +++ b/ppo-lora/checkpoint-1000/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1da5b73c9aa13a16f0875a3c73b3ec6df71a08d94ce82197b9a3d2f077f30a95 +size 21491 diff --git a/ppo-lora/checkpoint-2000/README.md b/ppo-lora/checkpoint-2000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/checkpoint-2000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/checkpoint-2000/adapter_config.json b/ppo-lora/checkpoint-2000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-2000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-2000/adapter_model.bin b/ppo-lora/checkpoint-2000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..730f858241580aa6c080966fbcf15a993d8389b0 --- /dev/null +++ b/ppo-lora/checkpoint-2000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0fbeb1c6409498c16a2c2f2e70b7446bf4ac1234fb8dc2f8df9806b2462ddb +size 26269517 diff --git a/ppo-lora/checkpoint-2000/finetuning_args.json b/ppo-lora/checkpoint-2000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/checkpoint-2000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/checkpoint-2000/reward/adapter_config.json b/ppo-lora/checkpoint-2000/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-2000/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-2000/reward/adapter_model.bin b/ppo-lora/checkpoint-2000/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/checkpoint-2000/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/checkpoint-2000/training_args.bin b/ppo-lora/checkpoint-2000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/checkpoint-2000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/checkpoint-2000/value_head.bin b/ppo-lora/checkpoint-2000/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..b13152db4a82961c99f0e4cc2e019e91b367dcbf --- /dev/null +++ b/ppo-lora/checkpoint-2000/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c26a0f0760505ea0f2efdc4bd9d8f0ceb4bd4a0d23211e24d96b907f4c0028 +size 21491 diff --git a/ppo-lora/checkpoint-3000/README.md b/ppo-lora/checkpoint-3000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/checkpoint-3000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/checkpoint-3000/adapter_config.json b/ppo-lora/checkpoint-3000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-3000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-3000/adapter_model.bin b/ppo-lora/checkpoint-3000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..259711448f27d2e67b257eddf00fcaf310e1e347 --- /dev/null +++ b/ppo-lora/checkpoint-3000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad9d239c7787f8d73de9875ae02a52464859764422d88a4970e344b4fd9faee +size 26269517 diff --git a/ppo-lora/checkpoint-3000/finetuning_args.json b/ppo-lora/checkpoint-3000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/checkpoint-3000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/checkpoint-3000/reward/adapter_config.json b/ppo-lora/checkpoint-3000/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-3000/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-3000/reward/adapter_model.bin b/ppo-lora/checkpoint-3000/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/checkpoint-3000/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/checkpoint-3000/training_args.bin b/ppo-lora/checkpoint-3000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/checkpoint-3000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/checkpoint-3000/value_head.bin b/ppo-lora/checkpoint-3000/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..00622f74a37afe0fb173ce4b3c479dc50b63f262 --- /dev/null +++ b/ppo-lora/checkpoint-3000/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3817aaf3884ab53bafa9a0a901eb2cc3329b55238d28a98b937ce5db5e888a9 +size 21491 diff --git a/ppo-lora/checkpoint-4000/README.md b/ppo-lora/checkpoint-4000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/checkpoint-4000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/checkpoint-4000/adapter_config.json b/ppo-lora/checkpoint-4000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-4000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-4000/adapter_model.bin b/ppo-lora/checkpoint-4000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb1ce6acb3016cb41a57baa5a9d20e65a1a1c507 --- /dev/null +++ b/ppo-lora/checkpoint-4000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e11cb62dcf8c47decf25bb4525c4921aa48aee0815306027ec7d96a32a459ae +size 26269517 diff --git a/ppo-lora/checkpoint-4000/finetuning_args.json b/ppo-lora/checkpoint-4000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/checkpoint-4000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/checkpoint-4000/reward/adapter_config.json b/ppo-lora/checkpoint-4000/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-4000/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-4000/reward/adapter_model.bin b/ppo-lora/checkpoint-4000/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/checkpoint-4000/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/checkpoint-4000/training_args.bin b/ppo-lora/checkpoint-4000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/checkpoint-4000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/checkpoint-4000/value_head.bin b/ppo-lora/checkpoint-4000/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..70f0199cf8f33321f817307951b03c5f29af947a --- /dev/null +++ b/ppo-lora/checkpoint-4000/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca5a9037d28fec50bc06f7b4768851167c5dbac08df3d6f579c0fc86e67c530 +size 21491 diff --git a/ppo-lora/checkpoint-5000/README.md b/ppo-lora/checkpoint-5000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/checkpoint-5000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/checkpoint-5000/adapter_config.json b/ppo-lora/checkpoint-5000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-5000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-5000/adapter_model.bin b/ppo-lora/checkpoint-5000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..c66134ca808ee2dd05d30af858716fe484321997 --- /dev/null +++ b/ppo-lora/checkpoint-5000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06839ee491e98e367765e336e05ec2ea6133406f411a33ae8b054c77dddb1513 +size 26269517 diff --git a/ppo-lora/checkpoint-5000/finetuning_args.json b/ppo-lora/checkpoint-5000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/checkpoint-5000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/checkpoint-5000/reward/adapter_config.json b/ppo-lora/checkpoint-5000/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-5000/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-5000/reward/adapter_model.bin b/ppo-lora/checkpoint-5000/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/checkpoint-5000/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/checkpoint-5000/training_args.bin b/ppo-lora/checkpoint-5000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/checkpoint-5000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/checkpoint-5000/value_head.bin b/ppo-lora/checkpoint-5000/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..272f9c41af3d28b0087ef7a69d82889d1e681021 --- /dev/null +++ b/ppo-lora/checkpoint-5000/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:404a4c61cdfa78d1d30457f1956181a78bd80eb3396e99ef0ed0cc40570d3ea3 +size 21491 diff --git a/ppo-lora/checkpoint-6000/README.md b/ppo-lora/checkpoint-6000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/checkpoint-6000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/checkpoint-6000/adapter_config.json b/ppo-lora/checkpoint-6000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-6000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-6000/adapter_model.bin b/ppo-lora/checkpoint-6000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..3546898ce11af6639edb40f34e9d9a2dfa81e305 --- /dev/null +++ b/ppo-lora/checkpoint-6000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0424271468f1a8d78da73c08a499c2e6a19aa5df3104bb1f83d462e37d39300e +size 26269517 diff --git a/ppo-lora/checkpoint-6000/finetuning_args.json b/ppo-lora/checkpoint-6000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/checkpoint-6000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/checkpoint-6000/reward/adapter_config.json b/ppo-lora/checkpoint-6000/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-6000/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-6000/reward/adapter_model.bin b/ppo-lora/checkpoint-6000/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/checkpoint-6000/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/checkpoint-6000/training_args.bin b/ppo-lora/checkpoint-6000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/checkpoint-6000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/checkpoint-6000/value_head.bin b/ppo-lora/checkpoint-6000/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..d23af54436c9f647d6928c6766226e5b5d8d870e --- /dev/null +++ b/ppo-lora/checkpoint-6000/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979ebda1f42550bcd586d79c224b64a3275688ea06d4c3440e83cb4ffc22b85e +size 21491 diff --git a/ppo-lora/checkpoint-7000/README.md b/ppo-lora/checkpoint-7000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/ppo-lora/checkpoint-7000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/ppo-lora/checkpoint-7000/adapter_config.json b/ppo-lora/checkpoint-7000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-7000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-7000/adapter_model.bin b/ppo-lora/checkpoint-7000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..438924fafc9245728daef5a9498d7145932afc7b --- /dev/null +++ b/ppo-lora/checkpoint-7000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814e8bdf306b4f1c6380b60b28b05463ba02c9d391f91bfba1abb6404c8ffacc +size 26269517 diff --git a/ppo-lora/checkpoint-7000/finetuning_args.json b/ppo-lora/checkpoint-7000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/checkpoint-7000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/checkpoint-7000/reward/adapter_config.json b/ppo-lora/checkpoint-7000/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/checkpoint-7000/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/checkpoint-7000/reward/adapter_model.bin b/ppo-lora/checkpoint-7000/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/checkpoint-7000/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/checkpoint-7000/training_args.bin b/ppo-lora/checkpoint-7000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/checkpoint-7000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/checkpoint-7000/value_head.bin b/ppo-lora/checkpoint-7000/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..05f3a7fedd1367cf23f132776af4aa8be357d18c --- /dev/null +++ b/ppo-lora/checkpoint-7000/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19d9dc404785b5c7f692696012e114f654ef881e0d4fb2a3a2bd376d63785177 +size 21491 diff --git a/ppo-lora/finetuning_args.json b/ppo-lora/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/ppo-lora/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/ppo-lora/reward/adapter_config.json b/ppo-lora/reward/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/ppo-lora/reward/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/ppo-lora/reward/adapter_model.bin b/ppo-lora/reward/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..8710093665dfdb9819e2f8817a1e25a4ccdd9935 --- /dev/null +++ b/ppo-lora/reward/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1621f48d9ad8feb1d6d31050275f0aafd080c5c07153301fe2f48411f4406 +size 443 diff --git a/ppo-lora/trainer_log.jsonl b/ppo-lora/trainer_log.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..77d18d3d5daf965002e35260c4f4d9c9013a4c7b --- /dev/null +++ b/ppo-lora/trainer_log.jsonl @@ -0,0 +1,706 @@ +{"current_steps": 9, "total_steps": 7063, "loss": 0.0058, "reward": -0.5258, "learning_rate": 9.999359182892298e-06, "epoch": 0.0, "percentage": 0.13, "elapsed_time": "0:03:43", "remaining_time": "2 days, 0:43:37"} +{"current_steps": 19, "total_steps": 7063, "loss": 0.0053, "reward": -0.5235, "learning_rate": 9.997144223525905e-06, "epoch": 0.0, "percentage": 0.27, "elapsed_time": "0:07:18", "remaining_time": "1 day, 21:09:33"} +{"current_steps": 29, "total_steps": 7063, "loss": 0.0063, "reward": -0.5422, "learning_rate": 9.993347911338379e-06, "epoch": 0.0, "percentage": 0.41, "elapsed_time": "0:10:53", "remaining_time": "1 day, 20:02:39"} +{"current_steps": 39, "total_steps": 7063, "loss": 0.0052, "reward": -0.5766, "learning_rate": 9.987971447677674e-06, "epoch": 0.01, "percentage": 0.55, "elapsed_time": "0:14:29", "remaining_time": "1 day, 19:30:27"} +{"current_steps": 49, "total_steps": 7063, "loss": 0.0042, "reward": -0.3694, "learning_rate": 9.981016533932741e-06, "epoch": 0.01, "percentage": 0.69, "elapsed_time": "0:18:08", "remaining_time": "1 day, 19:17:34"} +{"current_steps": 59, "total_steps": 7063, "loss": 0.004, "reward": -0.346, "learning_rate": 9.972485370995129e-06, "epoch": 0.01, "percentage": 0.84, "elapsed_time": "0:21:40", "remaining_time": "1 day, 18:53:25"} +{"current_steps": 69, "total_steps": 7063, "loss": 0.0047, "reward": -0.4197, "learning_rate": 9.962380658562499e-06, "epoch": 0.01, "percentage": 0.98, "elapsed_time": "0:25:25", "remaining_time": "1 day, 18:57:25"} +{"current_steps": 79, "total_steps": 7063, "loss": 0.0043, "reward": -0.1848, "learning_rate": 9.950705594284304e-06, "epoch": 0.01, "percentage": 1.12, "elapsed_time": "0:29:01", "remaining_time": "1 day, 18:46:16"} +{"current_steps": 89, "total_steps": 7063, "loss": 0.0046, "reward": -0.4406, "learning_rate": 9.937463872749902e-06, "epoch": 0.01, "percentage": 1.26, "elapsed_time": "0:32:36", "remaining_time": "1 day, 18:35:00"} +{"current_steps": 99, "total_steps": 7063, "loss": 0.0044, "reward": -0.4997, "learning_rate": 9.922659684319374e-06, "epoch": 0.01, "percentage": 1.4, "elapsed_time": "0:36:15", "remaining_time": "1 day, 18:30:31"} +{"current_steps": 109, "total_steps": 7063, "loss": 0.0048, "reward": -0.4274, "learning_rate": 9.906297713797501e-06, "epoch": 0.02, "percentage": 1.54, "elapsed_time": "0:39:54", "remaining_time": "1 day, 18:25:56"} +{"current_steps": 119, "total_steps": 7063, "loss": 0.0046, "reward": -0.3451, "learning_rate": 9.888383138951242e-06, "epoch": 0.02, "percentage": 1.68, "elapsed_time": "0:43:16", "remaining_time": "1 day, 18:04:52"} +{"current_steps": 129, "total_steps": 7063, "loss": 0.0051, "reward": -0.4131, "learning_rate": 9.868921628871223e-06, "epoch": 0.02, "percentage": 1.83, "elapsed_time": "0:47:07", "remaining_time": "1 day, 18:12:39"} +{"current_steps": 139, "total_steps": 7063, "loss": 0.004, "reward": -0.2998, "learning_rate": 9.847919342177744e-06, "epoch": 0.02, "percentage": 1.97, "elapsed_time": "0:50:39", "remaining_time": "1 day, 18:03:25"} +{"current_steps": 149, "total_steps": 7063, "loss": 0.0045, "reward": -0.4068, "learning_rate": 9.825382925071883e-06, "epoch": 0.02, "percentage": 2.11, "elapsed_time": "0:54:19", "remaining_time": "1 day, 18:00:28"} +{"current_steps": 159, "total_steps": 7063, "loss": 0.0051, "reward": -0.4744, "learning_rate": 9.801319509232287e-06, "epoch": 0.02, "percentage": 2.25, "elapsed_time": "0:57:55", "remaining_time": "1 day, 17:54:51"} +{"current_steps": 169, "total_steps": 7063, "loss": 0.0054, "reward": -0.5511, "learning_rate": 9.775736709558352e-06, "epoch": 0.02, "percentage": 2.39, "elapsed_time": "1:01:19", "remaining_time": "1 day, 17:41:45"} +{"current_steps": 179, "total_steps": 7063, "loss": 0.0055, "reward": -0.2605, "learning_rate": 9.748642621760474e-06, "epoch": 0.03, "percentage": 2.53, "elapsed_time": "1:05:00", "remaining_time": "1 day, 17:39:59"} +{"current_steps": 189, "total_steps": 7063, "loss": 0.0043, "reward": -0.4817, "learning_rate": 9.720045819798151e-06, "epoch": 0.03, "percentage": 2.68, "elapsed_time": "1:08:36", "remaining_time": "1 day, 17:35:15"} +{"current_steps": 199, "total_steps": 7063, "loss": 0.0061, "reward": -0.3717, "learning_rate": 9.68995535316674e-06, "epoch": 0.03, "percentage": 2.82, "elapsed_time": "1:12:14", "remaining_time": "1 day, 17:31:54"} +{"current_steps": 209, "total_steps": 7063, "loss": 0.0041, "reward": -0.3632, "learning_rate": 9.658380744033737e-06, "epoch": 0.03, "percentage": 2.96, "elapsed_time": "1:15:41", "remaining_time": "1 day, 17:22:21"} +{"current_steps": 219, "total_steps": 7063, "loss": 0.0039, "reward": -0.4044, "learning_rate": 9.625331984225475e-06, "epoch": 0.03, "percentage": 3.1, "elapsed_time": "1:19:14", "remaining_time": "1 day, 17:16:32"} +{"current_steps": 229, "total_steps": 7063, "loss": 0.0049, "reward": -0.3763, "learning_rate": 9.590819532065188e-06, "epoch": 0.03, "percentage": 3.24, "elapsed_time": "1:22:57", "remaining_time": "1 day, 17:15:53"} +{"current_steps": 239, "total_steps": 7063, "loss": 0.0053, "reward": -0.3172, "learning_rate": 9.554854309063474e-06, "epoch": 0.03, "percentage": 3.38, "elapsed_time": "1:26:31", "remaining_time": "1 day, 17:10:29"} +{"current_steps": 249, "total_steps": 7063, "loss": 0.0047, "reward": -0.5815, "learning_rate": 9.517447696462163e-06, "epoch": 0.04, "percentage": 3.53, "elapsed_time": "1:30:03", "remaining_time": "1 day, 17:04:26"} +{"current_steps": 259, "total_steps": 7063, "loss": 0.0048, "reward": -0.35, "learning_rate": 9.478611531632702e-06, "epoch": 0.04, "percentage": 3.67, "elapsed_time": "1:33:33", "remaining_time": "1 day, 16:57:39"} +{"current_steps": 269, "total_steps": 7063, "loss": 0.0054, "reward": -0.4544, "learning_rate": 9.438358104330215e-06, "epoch": 0.04, "percentage": 3.81, "elapsed_time": "1:37:05", "remaining_time": "1 day, 16:52:06"} +{"current_steps": 279, "total_steps": 7063, "loss": 0.0039, "reward": -0.3515, "learning_rate": 9.396700152804386e-06, "epoch": 0.04, "percentage": 3.95, "elapsed_time": "1:40:38", "remaining_time": "1 day, 16:47:02"} +{"current_steps": 289, "total_steps": 7063, "loss": 0.0052, "reward": -0.3799, "learning_rate": 9.353650859768423e-06, "epoch": 0.04, "percentage": 4.09, "elapsed_time": "1:44:11", "remaining_time": "1 day, 16:42:08"} +{"current_steps": 299, "total_steps": 7063, "loss": 0.0048, "reward": -0.5378, "learning_rate": 9.309223848227377e-06, "epoch": 0.04, "percentage": 4.23, "elapsed_time": "1:47:47", "remaining_time": "1 day, 16:38:28"} +{"current_steps": 309, "total_steps": 7063, "loss": 0.0057, "reward": -0.4758, "learning_rate": 9.26343317716712e-06, "epoch": 0.04, "percentage": 4.37, "elapsed_time": "1:51:32", "remaining_time": "1 day, 16:38:03"} +{"current_steps": 319, "total_steps": 7063, "loss": 0.0044, "reward": -0.5203, "learning_rate": 9.216293337105358e-06, "epoch": 0.05, "percentage": 4.52, "elapsed_time": "1:55:03", "remaining_time": "1 day, 16:32:28"} +{"current_steps": 329, "total_steps": 7063, "loss": 0.0054, "reward": -0.5237, "learning_rate": 9.167819245506095e-06, "epoch": 0.05, "percentage": 4.66, "elapsed_time": "1:58:32", "remaining_time": "1 day, 16:26:10"} +{"current_steps": 339, "total_steps": 7063, "loss": 0.0058, "reward": -0.2535, "learning_rate": 9.118026242058976e-06, "epoch": 0.05, "percentage": 4.8, "elapsed_time": "2:02:07", "remaining_time": "1 day, 16:22:11"} +{"current_steps": 349, "total_steps": 7063, "loss": 0.0067, "reward": -0.5059, "learning_rate": 9.066930083825025e-06, "epoch": 0.05, "percentage": 4.94, "elapsed_time": "2:05:46", "remaining_time": "1 day, 16:19:34"} +{"current_steps": 359, "total_steps": 7063, "loss": 0.0059, "reward": -0.5255, "learning_rate": 9.014546940250301e-06, "epoch": 0.05, "percentage": 5.08, "elapsed_time": "2:09:12", "remaining_time": "1 day, 16:12:57"} +{"current_steps": 369, "total_steps": 7063, "loss": 0.0047, "reward": -0.3411, "learning_rate": 8.960893388049056e-06, "epoch": 0.05, "percentage": 5.22, "elapsed_time": "2:12:40", "remaining_time": "1 day, 16:06:45"} +{"current_steps": 379, "total_steps": 7063, "loss": 0.0048, "reward": -0.3859, "learning_rate": 8.905986405958015e-06, "epoch": 0.05, "percentage": 5.37, "elapsed_time": "2:16:05", "remaining_time": "1 day, 16:00:09"} +{"current_steps": 389, "total_steps": 7063, "loss": 0.0058, "reward": -0.3785, "learning_rate": 8.849843369363425e-06, "epoch": 0.06, "percentage": 5.51, "elapsed_time": "2:19:37", "remaining_time": "1 day, 15:55:37"} +{"current_steps": 399, "total_steps": 7063, "loss": 0.0047, "reward": -0.3432, "learning_rate": 8.792482044802602e-06, "epoch": 0.06, "percentage": 5.65, "elapsed_time": "2:23:18", "remaining_time": "1 day, 15:53:35"} +{"current_steps": 409, "total_steps": 7063, "loss": 0.0057, "reward": -0.3958, "learning_rate": 8.733920584341673e-06, "epoch": 0.06, "percentage": 5.79, "elapsed_time": "2:26:51", "remaining_time": "1 day, 15:49:11"} +{"current_steps": 419, "total_steps": 7063, "loss": 0.0049, "reward": -0.4713, "learning_rate": 8.674177519831351e-06, "epoch": 0.06, "percentage": 5.93, "elapsed_time": "2:30:34", "remaining_time": "1 day, 15:47:35"} +{"current_steps": 429, "total_steps": 7063, "loss": 0.0048, "reward": -0.4485, "learning_rate": 8.613271757042483e-06, "epoch": 0.06, "percentage": 6.07, "elapsed_time": "2:34:19", "remaining_time": "1 day, 15:46:31"} +{"current_steps": 439, "total_steps": 7063, "loss": 0.0054, "reward": -0.5861, "learning_rate": 8.551222569683315e-06, "epoch": 0.06, "percentage": 6.22, "elapsed_time": "2:37:59", "remaining_time": "1 day, 15:43:55"} +{"current_steps": 449, "total_steps": 7063, "loss": 0.0052, "reward": -0.292, "learning_rate": 8.488049593300287e-06, "epoch": 0.06, "percentage": 6.36, "elapsed_time": "2:41:28", "remaining_time": "1 day, 15:38:38"} +{"current_steps": 459, "total_steps": 7063, "loss": 0.0049, "reward": -0.4702, "learning_rate": 8.423772819064349e-06, "epoch": 0.06, "percentage": 6.5, "elapsed_time": "2:45:03", "remaining_time": "1 day, 15:34:42"} +{"current_steps": 469, "total_steps": 7063, "loss": 0.0053, "reward": -0.5542, "learning_rate": 8.358412587444719e-06, "epoch": 0.07, "percentage": 6.64, "elapsed_time": "2:48:51", "remaining_time": "1 day, 15:34:10"} +{"current_steps": 479, "total_steps": 7063, "loss": 0.0048, "reward": -0.4116, "learning_rate": 8.291989581772126e-06, "epoch": 0.07, "percentage": 6.78, "elapsed_time": "2:52:22", "remaining_time": "1 day, 15:29:14"} +{"current_steps": 489, "total_steps": 7063, "loss": 0.005, "reward": -0.3746, "learning_rate": 8.224524821693534e-06, "epoch": 0.07, "percentage": 6.92, "elapsed_time": "2:55:51", "remaining_time": "1 day, 15:24:06"} +{"current_steps": 499, "total_steps": 7063, "loss": 0.0046, "reward": -0.4481, "learning_rate": 8.156039656520448e-06, "epoch": 0.07, "percentage": 7.06, "elapsed_time": "2:59:39", "remaining_time": "1 day, 15:23:13"} +{"current_steps": 509, "total_steps": 7063, "loss": 0.0043, "reward": -0.4127, "learning_rate": 8.086555758472905e-06, "epoch": 0.07, "percentage": 7.21, "elapsed_time": "3:03:18", "remaining_time": "1 day, 15:20:17"} +{"current_steps": 519, "total_steps": 7063, "loss": 0.0069, "reward": -0.5597, "learning_rate": 8.016095115821258e-06, "epoch": 0.07, "percentage": 7.35, "elapsed_time": "3:06:52", "remaining_time": "1 day, 15:16:22"} +{"current_steps": 529, "total_steps": 7063, "loss": 0.0061, "reward": -0.4318, "learning_rate": 7.944680025927976e-06, "epoch": 0.07, "percentage": 7.49, "elapsed_time": "3:10:29", "remaining_time": "1 day, 15:12:51"} +{"current_steps": 539, "total_steps": 7063, "loss": 0.0045, "reward": -0.3063, "learning_rate": 7.872333088191598e-06, "epoch": 0.08, "percentage": 7.63, "elapsed_time": "3:13:58", "remaining_time": "1 day, 15:07:45"} +{"current_steps": 549, "total_steps": 7063, "loss": 0.0048, "reward": -0.3184, "learning_rate": 7.799077196895131e-06, "epoch": 0.08, "percentage": 7.77, "elapsed_time": "3:17:42", "remaining_time": "1 day, 15:05:47"} +{"current_steps": 559, "total_steps": 7063, "loss": 0.0058, "reward": -0.476, "learning_rate": 7.724935533961129e-06, "epoch": 0.08, "percentage": 7.91, "elapsed_time": "3:21:19", "remaining_time": "1 day, 15:02:21"} +{"current_steps": 569, "total_steps": 7063, "loss": 0.0051, "reward": -0.3959, "learning_rate": 7.649931561615733e-06, "epoch": 0.08, "percentage": 8.06, "elapsed_time": "3:24:50", "remaining_time": "1 day, 14:57:56"} +{"current_steps": 579, "total_steps": 7063, "loss": 0.0051, "reward": -0.4472, "learning_rate": 7.574089014964029e-06, "epoch": 0.08, "percentage": 8.2, "elapsed_time": "3:28:20", "remaining_time": "1 day, 14:53:10"} +{"current_steps": 589, "total_steps": 7063, "loss": 0.0058, "reward": -0.3736, "learning_rate": 7.497431894479034e-06, "epoch": 0.08, "percentage": 8.34, "elapsed_time": "3:31:59", "remaining_time": "1 day, 14:50:11"} +{"current_steps": 599, "total_steps": 7063, "loss": 0.0043, "reward": -0.4911, "learning_rate": 7.419984458406722e-06, "epoch": 0.08, "percentage": 8.48, "elapsed_time": "3:35:35", "remaining_time": "1 day, 14:46:30"} +{"current_steps": 609, "total_steps": 7063, "loss": 0.005, "reward": -0.3037, "learning_rate": 7.341771215089468e-06, "epoch": 0.09, "percentage": 8.62, "elapsed_time": "3:39:18", "remaining_time": "1 day, 14:44:09"} +{"current_steps": 619, "total_steps": 7063, "loss": 0.0062, "reward": -0.4219, "learning_rate": 7.26281691521035e-06, "epoch": 0.09, "percentage": 8.76, "elapsed_time": "3:42:46", "remaining_time": "1 day, 14:39:05"} +{"current_steps": 629, "total_steps": 7063, "loss": 0.0051, "reward": -0.3435, "learning_rate": 7.183146543960761e-06, "epoch": 0.09, "percentage": 8.91, "elapsed_time": "3:46:23", "remaining_time": "1 day, 14:35:43"} +{"current_steps": 639, "total_steps": 7063, "loss": 0.0038, "reward": -0.3745, "learning_rate": 7.102785313133821e-06, "epoch": 0.09, "percentage": 9.05, "elapsed_time": "3:50:06", "remaining_time": "1 day, 14:33:17"} +{"current_steps": 649, "total_steps": 7063, "loss": 0.0053, "reward": -0.3743, "learning_rate": 7.021758653146058e-06, "epoch": 0.09, "percentage": 9.19, "elapsed_time": "3:53:36", "remaining_time": "1 day, 14:28:39"} +{"current_steps": 659, "total_steps": 7063, "loss": 0.006, "reward": -0.4696, "learning_rate": 6.940092204989934e-06, "epoch": 0.09, "percentage": 9.33, "elapsed_time": "3:57:18", "remaining_time": "1 day, 14:26:10"} +{"current_steps": 669, "total_steps": 7063, "loss": 0.0058, "reward": -0.4343, "learning_rate": 6.8578118121197144e-06, "epoch": 0.09, "percentage": 9.47, "elapsed_time": "4:00:55", "remaining_time": "1 day, 14:22:40"} +{"current_steps": 679, "total_steps": 7063, "loss": 0.0044, "reward": -0.2842, "learning_rate": 6.774943512273267e-06, "epoch": 0.1, "percentage": 9.61, "elapsed_time": "4:04:32", "remaining_time": "1 day, 14:19:07"} +{"current_steps": 689, "total_steps": 7063, "loss": 0.0046, "reward": -0.345, "learning_rate": 6.691513529232391e-06, "epoch": 0.1, "percentage": 9.76, "elapsed_time": "4:08:13", "remaining_time": "1 day, 14:16:18"} +{"current_steps": 699, "total_steps": 7063, "loss": 0.0047, "reward": -0.3973, "learning_rate": 6.607548264524268e-06, "epoch": 0.1, "percentage": 9.9, "elapsed_time": "4:11:46", "remaining_time": "1 day, 14:12:19"} +{"current_steps": 709, "total_steps": 7063, "loss": 0.0039, "reward": -0.3412, "learning_rate": 6.523074289066666e-06, "epoch": 0.1, "percentage": 10.04, "elapsed_time": "4:15:18", "remaining_time": "1 day, 14:07:59"} +{"current_steps": 719, "total_steps": 7063, "loss": 0.0054, "reward": -0.3593, "learning_rate": 6.43811833475953e-06, "epoch": 0.1, "percentage": 10.18, "elapsed_time": "4:18:57", "remaining_time": "1 day, 14:04:53"} +{"current_steps": 729, "total_steps": 7063, "loss": 0.0049, "reward": -0.3673, "learning_rate": 6.352707286025644e-06, "epoch": 0.1, "percentage": 10.32, "elapsed_time": "4:22:32", "remaining_time": "1 day, 14:01:08"} +{"current_steps": 739, "total_steps": 7063, "loss": 0.0046, "reward": -0.4224, "learning_rate": 6.266868171303017e-06, "epoch": 0.1, "percentage": 10.46, "elapsed_time": "4:26:08", "remaining_time": "1 day, 13:57:33"} +{"current_steps": 749, "total_steps": 7063, "loss": 0.0045, "reward": -0.1521, "learning_rate": 6.1806281544917e-06, "epoch": 0.11, "percentage": 10.6, "elapsed_time": "4:29:47", "remaining_time": "1 day, 13:54:20"} +{"current_steps": 759, "total_steps": 7063, "loss": 0.0056, "reward": -0.3997, "learning_rate": 6.094014526357734e-06, "epoch": 0.11, "percentage": 10.75, "elapsed_time": "4:33:15", "remaining_time": "1 day, 13:49:36"} +{"current_steps": 769, "total_steps": 7063, "loss": 0.0046, "reward": -0.289, "learning_rate": 6.007054695896955e-06, "epoch": 0.11, "percentage": 10.89, "elapsed_time": "4:36:51", "remaining_time": "1 day, 13:45:55"} +{"current_steps": 779, "total_steps": 7063, "loss": 0.0042, "reward": -0.3431, "learning_rate": 5.9197761816613705e-06, "epoch": 0.11, "percentage": 11.03, "elapsed_time": "4:40:29", "remaining_time": "1 day, 13:42:41"} +{"current_steps": 789, "total_steps": 7063, "loss": 0.0049, "reward": -0.3222, "learning_rate": 5.8322066030508924e-06, "epoch": 0.11, "percentage": 11.17, "elapsed_time": "4:44:04", "remaining_time": "1 day, 13:38:55"} +{"current_steps": 799, "total_steps": 7063, "loss": 0.0055, "reward": -0.4949, "learning_rate": 5.74437367157313e-06, "epoch": 0.11, "percentage": 11.31, "elapsed_time": "4:47:42", "remaining_time": "1 day, 13:35:31"} +{"current_steps": 809, "total_steps": 7063, "loss": 0.0065, "reward": -0.4194, "learning_rate": 5.656305182074053e-06, "epoch": 0.11, "percentage": 11.45, "elapsed_time": "4:51:16", "remaining_time": "1 day, 13:31:40"} +{"current_steps": 819, "total_steps": 7063, "loss": 0.005, "reward": -0.5284, "learning_rate": 5.568029003942271e-06, "epoch": 0.12, "percentage": 11.6, "elapsed_time": "4:54:55", "remaining_time": "1 day, 13:28:27"} +{"current_steps": 829, "total_steps": 7063, "loss": 0.0058, "reward": -0.5156, "learning_rate": 5.4795730722897435e-06, "epoch": 0.12, "percentage": 11.74, "elapsed_time": "4:58:25", "remaining_time": "1 day, 13:24:05"} +{"current_steps": 839, "total_steps": 7063, "loss": 0.0043, "reward": -0.3164, "learning_rate": 5.390965379111655e-06, "epoch": 0.12, "percentage": 11.88, "elapsed_time": "5:02:04", "remaining_time": "1 day, 13:20:56"} +{"current_steps": 849, "total_steps": 7063, "loss": 0.004, "reward": -0.1936, "learning_rate": 5.302233964428329e-06, "epoch": 0.12, "percentage": 12.02, "elapsed_time": "5:05:45", "remaining_time": "1 day, 13:17:57"} +{"current_steps": 859, "total_steps": 7063, "loss": 0.0039, "reward": -0.2792, "learning_rate": 5.213406907411921e-06, "epoch": 0.12, "percentage": 12.16, "elapsed_time": "5:09:24", "remaining_time": "1 day, 13:14:40"} +{"current_steps": 869, "total_steps": 7063, "loss": 0.005, "reward": -0.2348, "learning_rate": 5.124512317500723e-06, "epoch": 0.12, "percentage": 12.3, "elapsed_time": "5:13:00", "remaining_time": "1 day, 13:11:02"} +{"current_steps": 879, "total_steps": 7063, "loss": 0.0042, "reward": -0.3528, "learning_rate": 5.035578325503908e-06, "epoch": 0.12, "percentage": 12.45, "elapsed_time": "5:16:36", "remaining_time": "1 day, 13:07:24"} +{"current_steps": 889, "total_steps": 7063, "loss": 0.005, "reward": -0.3753, "learning_rate": 4.946633074699485e-06, "epoch": 0.13, "percentage": 12.59, "elapsed_time": "5:20:11", "remaining_time": "1 day, 13:03:38"} +{"current_steps": 899, "total_steps": 7063, "loss": 0.0052, "reward": -0.4383, "learning_rate": 4.857704711928325e-06, "epoch": 0.13, "percentage": 12.73, "elapsed_time": "5:23:47", "remaining_time": "1 day, 13:00:06"} +{"current_steps": 909, "total_steps": 7063, "loss": 0.0045, "reward": -0.3664, "learning_rate": 4.768821378687066e-06, "epoch": 0.13, "percentage": 12.87, "elapsed_time": "5:27:17", "remaining_time": "1 day, 12:55:49"} +{"current_steps": 919, "total_steps": 7063, "loss": 0.0043, "reward": -0.3584, "learning_rate": 4.6800112022226865e-06, "epoch": 0.13, "percentage": 13.01, "elapsed_time": "5:30:41", "remaining_time": "1 day, 12:50:51"} +{"current_steps": 929, "total_steps": 7063, "loss": 0.0048, "reward": -0.455, "learning_rate": 4.591302286631612e-06, "epoch": 0.13, "percentage": 13.15, "elapsed_time": "5:34:19", "remaining_time": "1 day, 12:47:29"} +{"current_steps": 939, "total_steps": 7063, "loss": 0.004, "reward": -0.3906, "learning_rate": 4.502722703966126e-06, "epoch": 0.13, "percentage": 13.29, "elapsed_time": "5:37:55", "remaining_time": "1 day, 12:43:53"} +{"current_steps": 949, "total_steps": 7063, "loss": 0.0046, "reward": -0.4897, "learning_rate": 4.414300485350945e-06, "epoch": 0.13, "percentage": 13.44, "elapsed_time": "5:41:27", "remaining_time": "1 day, 12:39:54"} +{"current_steps": 959, "total_steps": 7063, "loss": 0.0042, "reward": -0.384, "learning_rate": 4.326063612112721e-06, "epoch": 0.14, "percentage": 13.58, "elapsed_time": "5:45:11", "remaining_time": "1 day, 12:37:09"} +{"current_steps": 969, "total_steps": 7063, "loss": 0.0039, "reward": -0.4159, "learning_rate": 4.2380400069253255e-06, "epoch": 0.14, "percentage": 13.72, "elapsed_time": "5:48:43", "remaining_time": "1 day, 12:33:06"} +{"current_steps": 979, "total_steps": 7063, "loss": 0.0048, "reward": -0.4036, "learning_rate": 4.15025752497367e-06, "epoch": 0.14, "percentage": 13.86, "elapsed_time": "5:52:18", "remaining_time": "1 day, 12:29:22"} +{"current_steps": 989, "total_steps": 7063, "loss": 0.0042, "reward": -0.4189, "learning_rate": 4.062743945138906e-06, "epoch": 0.14, "percentage": 14.0, "elapsed_time": "5:55:52", "remaining_time": "1 day, 12:25:39"} +{"current_steps": 999, "total_steps": 7063, "loss": 0.005, "reward": -0.2446, "learning_rate": 3.975526961207759e-06, "epoch": 0.14, "percentage": 14.14, "elapsed_time": "5:59:16", "remaining_time": "1 day, 12:20:47"} +{"current_steps": 1009, "total_steps": 7063, "loss": 0.0047, "reward": -0.3705, "learning_rate": 3.88863417310879e-06, "epoch": 0.14, "percentage": 14.29, "elapsed_time": "6:02:53", "remaining_time": "1 day, 12:17:23"} +{"current_steps": 1019, "total_steps": 7063, "loss": 0.0048, "reward": -0.3862, "learning_rate": 3.8020930781783704e-06, "epoch": 0.14, "percentage": 14.43, "elapsed_time": "6:06:28", "remaining_time": "1 day, 12:13:41"} +{"current_steps": 1029, "total_steps": 7063, "loss": 0.0041, "reward": -0.4077, "learning_rate": 3.7159310624591055e-06, "epoch": 0.15, "percentage": 14.57, "elapsed_time": "6:10:05", "remaining_time": "1 day, 12:10:11"} +{"current_steps": 1039, "total_steps": 7063, "loss": 0.0072, "reward": -0.2784, "learning_rate": 3.630175392033488e-06, "epoch": 0.15, "percentage": 14.71, "elapsed_time": "6:13:38", "remaining_time": "1 day, 12:06:19"} +{"current_steps": 1049, "total_steps": 7063, "loss": 0.0058, "reward": -0.436, "learning_rate": 3.544853204395513e-06, "epoch": 0.15, "percentage": 14.85, "elapsed_time": "6:17:01", "remaining_time": "1 day, 12:01:30"} +{"current_steps": 1059, "total_steps": 7063, "loss": 0.0045, "reward": -0.3979, "learning_rate": 3.45999149986298e-06, "epoch": 0.15, "percentage": 14.99, "elapsed_time": "6:20:40", "remaining_time": "1 day, 11:58:16"} +{"current_steps": 1069, "total_steps": 7063, "loss": 0.0055, "reward": -0.4709, "learning_rate": 3.375617133033209e-06, "epoch": 0.15, "percentage": 15.14, "elapsed_time": "6:24:12", "remaining_time": "1 day, 11:54:18"} +{"current_steps": 1079, "total_steps": 7063, "loss": 0.0036, "reward": -0.3748, "learning_rate": 3.2917568042848648e-06, "epoch": 0.15, "percentage": 15.28, "elapsed_time": "6:27:46", "remaining_time": "1 day, 11:50:34"} +{"current_steps": 1089, "total_steps": 7063, "loss": 0.0057, "reward": -0.586, "learning_rate": 3.2167439478854534e-06, "epoch": 0.15, "percentage": 15.42, "elapsed_time": "6:31:30", "remaining_time": "1 day, 11:47:43"} +{"current_steps": 1099, "total_steps": 7063, "loss": 0.0047, "reward": -0.2301, "learning_rate": 3.1339332616713215e-06, "epoch": 0.16, "percentage": 15.56, "elapsed_time": "6:35:15", "remaining_time": "1 day, 11:44:55"} +{"current_steps": 1109, "total_steps": 7063, "loss": 0.0052, "reward": -0.4129, "learning_rate": 3.051713094715606e-06, "epoch": 0.16, "percentage": 15.7, "elapsed_time": "6:38:45", "remaining_time": "1 day, 11:40:49"} +{"current_steps": 1119, "total_steps": 7063, "loss": 0.0044, "reward": -0.2389, "learning_rate": 2.9701094656976084e-06, "epoch": 0.16, "percentage": 15.84, "elapsed_time": "6:42:26", "remaining_time": "1 day, 11:37:44"} +{"current_steps": 1129, "total_steps": 7063, "loss": 0.0039, "reward": -0.3641, "learning_rate": 2.8891481981923897e-06, "epoch": 0.16, "percentage": 15.98, "elapsed_time": "6:46:05", "remaining_time": "1 day, 11:34:24"} +{"current_steps": 1139, "total_steps": 7063, "loss": 0.0052, "reward": -0.3099, "learning_rate": 2.8088549124988785e-06, "epoch": 0.16, "percentage": 16.13, "elapsed_time": "6:49:39", "remaining_time": "1 day, 11:30:40"} +{"current_steps": 1149, "total_steps": 7063, "loss": 0.0037, "reward": -0.3203, "learning_rate": 2.729255017532277e-06, "epoch": 0.16, "percentage": 16.27, "elapsed_time": "6:53:18", "remaining_time": "1 day, 11:27:17"} +{"current_steps": 1159, "total_steps": 7063, "loss": 0.0052, "reward": -0.4073, "learning_rate": 2.6503737027833926e-06, "epoch": 0.16, "percentage": 16.41, "elapsed_time": "6:57:01", "remaining_time": "1 day, 11:24:20"} +{"current_steps": 1169, "total_steps": 7063, "loss": 0.0052, "reward": -0.3275, "learning_rate": 2.5722359303473778e-06, "epoch": 0.17, "percentage": 16.55, "elapsed_time": "7:00:25", "remaining_time": "1 day, 11:19:45"} +{"current_steps": 1179, "total_steps": 7063, "loss": 0.004, "reward": -0.3811, "learning_rate": 2.494866427024452e-06, "epoch": 0.17, "percentage": 16.69, "elapsed_time": "7:03:55", "remaining_time": "1 day, 11:15:42"} +{"current_steps": 1189, "total_steps": 7063, "loss": 0.0052, "reward": -0.3413, "learning_rate": 2.4182896764950726e-06, "epoch": 0.17, "percentage": 16.83, "elapsed_time": "7:07:31", "remaining_time": "1 day, 11:12:03"} +{"current_steps": 1199, "total_steps": 7063, "loss": 0.0052, "reward": -0.5202, "learning_rate": 2.3425299115720295e-06, "epoch": 0.17, "percentage": 16.98, "elapsed_time": "7:11:04", "remaining_time": "1 day, 11:08:17"} +{"current_steps": 1209, "total_steps": 7063, "loss": 0.0048, "reward": -0.3018, "learning_rate": 2.267611106531961e-06, "epoch": 0.17, "percentage": 17.12, "elapsed_time": "7:14:49", "remaining_time": "1 day, 11:05:27"} +{"current_steps": 1219, "total_steps": 7063, "loss": 0.0056, "reward": -0.4154, "learning_rate": 2.193556969528642e-06, "epoch": 0.17, "percentage": 17.26, "elapsed_time": "7:18:32", "remaining_time": "1 day, 11:02:24"} +{"current_steps": 1229, "total_steps": 7063, "loss": 0.0046, "reward": -0.3844, "learning_rate": 2.1203909350905215e-06, "epoch": 0.17, "percentage": 17.4, "elapsed_time": "7:22:10", "remaining_time": "1 day, 10:58:56"} +{"current_steps": 1239, "total_steps": 7063, "loss": 0.0052, "reward": -0.3442, "learning_rate": 2.048136156704833e-06, "epoch": 0.18, "percentage": 17.54, "elapsed_time": "7:25:44", "remaining_time": "1 day, 10:55:14"} +{"current_steps": 1249, "total_steps": 7063, "loss": 0.0053, "reward": -0.357, "learning_rate": 1.9768154994906352e-06, "epoch": 0.18, "percentage": 17.68, "elapsed_time": "7:29:12", "remaining_time": "1 day, 10:51:03"} +{"current_steps": 1259, "total_steps": 7063, "loss": 0.0043, "reward": -0.2778, "learning_rate": 1.9064515329631267e-06, "epoch": 0.18, "percentage": 17.83, "elapsed_time": "7:32:49", "remaining_time": "1 day, 10:47:31"} +{"current_steps": 1269, "total_steps": 7063, "loss": 0.0066, "reward": -0.3448, "learning_rate": 1.837066523891483e-06, "epoch": 0.18, "percentage": 17.97, "elapsed_time": "7:36:09", "remaining_time": "1 day, 10:42:42"} +{"current_steps": 1279, "total_steps": 7063, "loss": 0.0051, "reward": -0.3787, "learning_rate": 1.768682429252519e-06, "epoch": 0.18, "percentage": 18.11, "elapsed_time": "7:39:38", "remaining_time": "1 day, 10:38:36"} +{"current_steps": 1289, "total_steps": 7063, "loss": 0.004, "reward": -0.4296, "learning_rate": 1.7013208892823618e-06, "epoch": 0.18, "percentage": 18.25, "elapsed_time": "7:43:17", "remaining_time": "1 day, 10:35:15"} +{"current_steps": 1299, "total_steps": 7063, "loss": 0.0047, "reward": -0.5144, "learning_rate": 1.6350032206283833e-06, "epoch": 0.18, "percentage": 18.39, "elapsed_time": "7:46:50", "remaining_time": "1 day, 10:31:29"} +{"current_steps": 1309, "total_steps": 7063, "loss": 0.0052, "reward": -0.331, "learning_rate": 1.5697504096035116e-06, "epoch": 0.19, "percentage": 18.53, "elapsed_time": "7:50:28", "remaining_time": "1 day, 10:28:03"} +{"current_steps": 1319, "total_steps": 7063, "loss": 0.0039, "reward": -0.3365, "learning_rate": 1.5055831055450825e-06, "epoch": 0.19, "percentage": 18.67, "elapsed_time": "7:53:57", "remaining_time": "1 day, 10:23:58"} +{"current_steps": 1329, "total_steps": 7063, "loss": 0.0047, "reward": -0.3728, "learning_rate": 1.4425216142803395e-06, "epoch": 0.19, "percentage": 18.82, "elapsed_time": "7:57:35", "remaining_time": "1 day, 10:20:35"} +{"current_steps": 1339, "total_steps": 7063, "loss": 0.0048, "reward": -0.3547, "learning_rate": 1.3805858917006148e-06, "epoch": 0.19, "percentage": 18.96, "elapsed_time": "8:01:16", "remaining_time": "1 day, 10:17:22"} +{"current_steps": 1349, "total_steps": 7063, "loss": 0.0043, "reward": -0.3398, "learning_rate": 1.3197955374462767e-06, "epoch": 0.19, "percentage": 19.1, "elapsed_time": "8:04:59", "remaining_time": "1 day, 10:14:17"} +{"current_steps": 1359, "total_steps": 7063, "loss": 0.0056, "reward": -0.2891, "learning_rate": 1.260169788704383e-06, "epoch": 0.19, "percentage": 19.24, "elapsed_time": "8:08:32", "remaining_time": "1 day, 10:10:32"} +{"current_steps": 1369, "total_steps": 7063, "loss": 0.0042, "reward": -0.3165, "learning_rate": 1.2017275141210604e-06, "epoch": 0.19, "percentage": 19.38, "elapsed_time": "8:12:12", "remaining_time": "1 day, 10:07:11"} +{"current_steps": 1379, "total_steps": 7063, "loss": 0.0039, "reward": -0.366, "learning_rate": 1.1444872078304865e-06, "epoch": 0.2, "percentage": 19.52, "elapsed_time": "8:15:51", "remaining_time": "1 day, 10:03:50"} +{"current_steps": 1389, "total_steps": 7063, "loss": 0.004, "reward": -0.2873, "learning_rate": 1.0884669836024058e-06, "epoch": 0.2, "percentage": 19.67, "elapsed_time": "8:19:28", "remaining_time": "1 day, 10:00:18"} +{"current_steps": 1399, "total_steps": 7063, "loss": 0.0046, "reward": -0.2922, "learning_rate": 1.033684569109994e-06, "epoch": 0.2, "percentage": 19.81, "elapsed_time": "8:23:05", "remaining_time": "1 day, 9:56:49"} +{"current_steps": 1409, "total_steps": 7063, "loss": 0.0037, "reward": -0.3076, "learning_rate": 9.80157300319926e-07, "epoch": 0.2, "percentage": 19.95, "elapsed_time": "8:26:41", "remaining_time": "1 day, 9:53:13"} +{"current_steps": 1419, "total_steps": 7063, "loss": 0.0066, "reward": -0.5213, "learning_rate": 9.279021160063712e-07, "epoch": 0.2, "percentage": 20.09, "elapsed_time": "8:30:07", "remaining_time": "1 day, 9:48:59"} +{"current_steps": 1429, "total_steps": 7063, "loss": 0.0044, "reward": -0.5063, "learning_rate": 8.769355523907086e-07, "epoch": 0.2, "percentage": 20.23, "elapsed_time": "8:33:45", "remaining_time": "1 day, 9:45:33"} +{"current_steps": 1439, "total_steps": 7063, "loss": 0.0041, "reward": -0.5909, "learning_rate": 8.272737379086088e-07, "epoch": 0.2, "percentage": 20.37, "elapsed_time": "8:37:23", "remaining_time": "1 day, 9:42:06"} +{"current_steps": 1449, "total_steps": 7063, "loss": 0.0044, "reward": -0.2486, "learning_rate": 7.789323881061777e-07, "epoch": 0.21, "percentage": 20.52, "elapsed_time": "8:41:10", "remaining_time": "1 day, 9:39:14"} +{"current_steps": 1459, "total_steps": 7063, "loss": 0.0044, "reward": -0.4971, "learning_rate": 7.31926800666744e-07, "epoch": 0.21, "percentage": 20.66, "elapsed_time": "8:44:52", "remaining_time": "1 day, 9:36:04"} +{"current_steps": 1469, "total_steps": 7063, "loss": 0.0043, "reward": -0.5182, "learning_rate": 6.862718505698945e-07, "epoch": 0.21, "percentage": 20.8, "elapsed_time": "8:48:24", "remaining_time": "1 day, 9:32:11"} +{"current_steps": 1479, "total_steps": 7063, "loss": 0.0046, "reward": -0.2389, "learning_rate": 6.419819853842591e-07, "epoch": 0.21, "percentage": 20.94, "elapsed_time": "8:52:03", "remaining_time": "1 day, 9:28:46"} +{"current_steps": 1489, "total_steps": 7063, "loss": 0.0039, "reward": -0.3725, "learning_rate": 5.990712206955674e-07, "epoch": 0.21, "percentage": 21.08, "elapsed_time": "8:55:47", "remaining_time": "1 day, 9:25:41"} +{"current_steps": 1499, "total_steps": 7063, "loss": 0.0046, "reward": -0.4709, "learning_rate": 5.575531356713904e-07, "epoch": 0.21, "percentage": 21.22, "elapsed_time": "8:59:14", "remaining_time": "1 day, 9:21:32"} +{"current_steps": 1509, "total_steps": 7063, "loss": 0.005, "reward": -0.3545, "learning_rate": 5.17440868764002e-07, "epoch": 0.21, "percentage": 21.36, "elapsed_time": "9:02:46", "remaining_time": "1 day, 9:17:45"} +{"current_steps": 1519, "total_steps": 7063, "loss": 0.0041, "reward": -0.2898, "learning_rate": 4.787471135526945e-07, "epoch": 0.22, "percentage": 21.51, "elapsed_time": "9:06:28", "remaining_time": "1 day, 9:14:28"} +{"current_steps": 1529, "total_steps": 7063, "loss": 0.0045, "reward": -0.4093, "learning_rate": 4.414841147268811e-07, "epoch": 0.22, "percentage": 21.65, "elapsed_time": "9:10:01", "remaining_time": "1 day, 9:10:43"} +{"current_steps": 1539, "total_steps": 7063, "loss": 0.004, "reward": -0.3965, "learning_rate": 4.056636642112427e-07, "epoch": 0.22, "percentage": 21.79, "elapsed_time": "9:13:40", "remaining_time": "1 day, 9:07:19"} +{"current_steps": 1549, "total_steps": 7063, "loss": 0.0045, "reward": -0.3877, "learning_rate": 3.7129709743416733e-07, "epoch": 0.22, "percentage": 21.93, "elapsed_time": "9:17:02", "remaining_time": "1 day, 9:02:54"} +{"current_steps": 1559, "total_steps": 7063, "loss": 0.0046, "reward": -0.3655, "learning_rate": 3.3839528974062843e-07, "epoch": 0.22, "percentage": 22.07, "elapsed_time": "9:20:31", "remaining_time": "1 day, 8:58:54"} +{"current_steps": 1569, "total_steps": 7063, "loss": 0.0045, "reward": -0.5236, "learning_rate": 3.069686529506777e-07, "epoch": 0.22, "percentage": 22.21, "elapsed_time": "9:24:04", "remaining_time": "1 day, 8:55:09"} +{"current_steps": 1579, "total_steps": 7063, "loss": 0.0053, "reward": -0.441, "learning_rate": 2.770271320646023e-07, "epoch": 0.22, "percentage": 22.36, "elapsed_time": "9:27:24", "remaining_time": "1 day, 8:50:39"} +{"current_steps": 1589, "total_steps": 7063, "loss": 0.004, "reward": -0.2618, "learning_rate": 2.4858020211582346e-07, "epoch": 0.22, "percentage": 22.5, "elapsed_time": "9:30:59", "remaining_time": "1 day, 8:47:00"} +{"current_steps": 1599, "total_steps": 7063, "loss": 0.004, "reward": -0.4623, "learning_rate": 2.2163686517250427e-07, "epoch": 0.23, "percentage": 22.64, "elapsed_time": "9:34:38", "remaining_time": "1 day, 8:43:37"} +{"current_steps": 1609, "total_steps": 7063, "loss": 0.0038, "reward": -0.2542, "learning_rate": 1.962056474888391e-07, "epoch": 0.23, "percentage": 22.78, "elapsed_time": "9:38:18", "remaining_time": "1 day, 8:40:17"} +{"current_steps": 1619, "total_steps": 7063, "loss": 0.0051, "reward": -0.377, "learning_rate": 1.7229459680690176e-07, "epoch": 0.23, "percentage": 22.92, "elapsed_time": "9:41:59", "remaining_time": "1 day, 8:37:00"} +{"current_steps": 1629, "total_steps": 7063, "loss": 0.0046, "reward": -0.3763, "learning_rate": 1.4991127980993503e-07, "epoch": 0.23, "percentage": 23.06, "elapsed_time": "9:45:40", "remaining_time": "1 day, 8:33:42"} +{"current_steps": 1639, "total_steps": 7063, "loss": 0.0046, "reward": -0.4469, "learning_rate": 1.290627797278593e-07, "epoch": 0.23, "percentage": 23.21, "elapsed_time": "9:49:23", "remaining_time": "1 day, 8:30:29"} +{"current_steps": 1649, "total_steps": 7063, "loss": 0.0054, "reward": -0.4301, "learning_rate": 1.0975569409577668e-07, "epoch": 0.23, "percentage": 23.35, "elapsed_time": "9:52:58", "remaining_time": "1 day, 8:26:51"} +{"current_steps": 1659, "total_steps": 7063, "loss": 0.0047, "reward": -0.481, "learning_rate": 9.199613266616891e-08, "epoch": 0.23, "percentage": 23.49, "elapsed_time": "9:56:37", "remaining_time": "1 day, 8:23:25"} +{"current_steps": 1669, "total_steps": 7063, "loss": 0.0047, "reward": -0.549, "learning_rate": 7.578971547546554e-08, "epoch": 0.24, "percentage": 23.63, "elapsed_time": "10:00:12", "remaining_time": "1 day, 8:19:47"} +{"current_steps": 1679, "total_steps": 7063, "loss": 0.0058, "reward": -0.3571, "learning_rate": 6.114157106556773e-08, "epoch": 0.24, "percentage": 23.77, "elapsed_time": "10:03:46", "remaining_time": "1 day, 8:16:05"} +{"current_steps": 1689, "total_steps": 7063, "loss": 0.005, "reward": -0.3539, "learning_rate": 4.8056334860921426e-08, "epoch": 0.24, "percentage": 23.91, "elapsed_time": "10:07:21", "remaining_time": "1 day, 8:12:27"} +{"current_steps": 1699, "total_steps": 7063, "loss": 0.0037, "reward": -0.3161, "learning_rate": 3.653814770162578e-08, "epoch": 0.24, "percentage": 24.05, "elapsed_time": "10:10:53", "remaining_time": "1 day, 8:08:41"} +{"current_steps": 1709, "total_steps": 7063, "loss": 0.0053, "reward": -0.4499, "learning_rate": 2.6590654533062975e-08, "epoch": 0.24, "percentage": 24.2, "elapsed_time": "10:14:32", "remaining_time": "1 day, 8:05:13"} +{"current_steps": 1719, "total_steps": 7063, "loss": 0.0047, "reward": -0.3267, "learning_rate": 1.821700325244813e-08, "epoch": 0.24, "percentage": 24.34, "elapsed_time": "10:17:59", "remaining_time": "1 day, 8:01:13"} +{"current_steps": 1729, "total_steps": 7063, "loss": 0.0043, "reward": -0.4299, "learning_rate": 1.141984371267335e-08, "epoch": 0.24, "percentage": 24.48, "elapsed_time": "10:21:40", "remaining_time": "1 day, 7:57:53"} +{"current_steps": 1739, "total_steps": 7063, "loss": 0.0051, "reward": -0.4119, "learning_rate": 6.2013268837601834e-09, "epoch": 0.25, "percentage": 24.62, "elapsed_time": "10:25:12", "remaining_time": "1 day, 7:54:04"} +{"current_steps": 1749, "total_steps": 7063, "loss": 0.0048, "reward": -0.492, "learning_rate": 2.5631041721801976e-09, "epoch": 0.25, "percentage": 24.76, "elapsed_time": "10:28:50", "remaining_time": "1 day, 7:50:35"} +{"current_steps": 1759, "total_steps": 7063, "loss": 0.0053, "reward": -0.5111, "learning_rate": 5.063268982646863e-10, "epoch": 0.25, "percentage": 24.9, "elapsed_time": "10:32:18", "remaining_time": "1 day, 7:46:37"} +{"current_steps": 1769, "total_steps": 7063, "loss": 0.0057, "reward": -0.5665, "learning_rate": 3.164593187165999e-11, "epoch": 0.25, "percentage": 25.05, "elapsed_time": "10:35:54", "remaining_time": "1 day, 7:43:02"} +{"current_steps": 1779, "total_steps": 7063, "loss": 0.0039, "reward": -0.3717, "learning_rate": 1.1392114864122727e-09, "epoch": 0.25, "percentage": 25.19, "elapsed_time": "10:39:34", "remaining_time": "1 day, 7:39:41"} +{"current_steps": 1789, "total_steps": 7063, "loss": 0.0049, "reward": -0.4831, "learning_rate": 3.828673071319955e-09, "epoch": 0.25, "percentage": 25.33, "elapsed_time": "10:43:12", "remaining_time": "1 day, 7:36:12"} +{"current_steps": 1799, "total_steps": 7063, "loss": 0.0052, "reward": -0.4277, "learning_rate": 8.099179602960583e-09, "epoch": 0.25, "percentage": 25.47, "elapsed_time": "10:46:51", "remaining_time": "1 day, 7:32:46"} +{"current_steps": 1809, "total_steps": 7063, "loss": 0.0047, "reward": -0.3236, "learning_rate": 1.3949379673960372e-08, "epoch": 0.26, "percentage": 25.61, "elapsed_time": "10:50:34", "remaining_time": "1 day, 7:29:29"} +{"current_steps": 1819, "total_steps": 7063, "loss": 0.0044, "reward": -0.4584, "learning_rate": 2.1377421980859903e-08, "epoch": 0.26, "percentage": 25.75, "elapsed_time": "10:54:14", "remaining_time": "1 day, 7:26:07"} +{"current_steps": 1829, "total_steps": 7063, "loss": 0.004, "reward": -0.427, "learning_rate": 3.0380955909962706e-08, "epoch": 0.26, "percentage": 25.9, "elapsed_time": "10:57:49", "remaining_time": "1 day, 7:22:28"} +{"current_steps": 1839, "total_steps": 7063, "loss": 0.0046, "reward": -0.4793, "learning_rate": 4.095713228118803e-08, "epoch": 0.26, "percentage": 26.04, "elapsed_time": "11:01:27", "remaining_time": "1 day, 7:19:00"} +{"current_steps": 1849, "total_steps": 7063, "loss": 0.005, "reward": -0.3642, "learning_rate": 5.310260424970071e-08, "epoch": 0.26, "percentage": 26.18, "elapsed_time": "11:04:56", "remaining_time": "1 day, 7:15:04"} +{"current_steps": 1859, "total_steps": 7063, "loss": 0.0036, "reward": -0.3235, "learning_rate": 6.681352836502009e-08, "epoch": 0.26, "percentage": 26.32, "elapsed_time": "11:08:38", "remaining_time": "1 day, 7:11:46"} +{"current_steps": 1869, "total_steps": 7063, "loss": 0.0055, "reward": -0.4695, "learning_rate": 8.208556578728933e-08, "epoch": 0.26, "percentage": 26.46, "elapsed_time": "11:12:16", "remaining_time": "1 day, 7:08:16"} +{"current_steps": 1879, "total_steps": 7063, "loss": 0.005, "reward": -0.3998, "learning_rate": 9.891388366030486e-08, "epoch": 0.27, "percentage": 26.6, "elapsed_time": "11:16:02", "remaining_time": "1 day, 7:05:08"} +{"current_steps": 1889, "total_steps": 7063, "loss": 0.0046, "reward": -0.3878, "learning_rate": 1.172931566408797e-07, "epoch": 0.27, "percentage": 26.75, "elapsed_time": "11:19:46", "remaining_time": "1 day, 7:01:53"} +{"current_steps": 1899, "total_steps": 7063, "loss": 0.0055, "reward": -0.5067, "learning_rate": 1.3721756858405545e-07, "epoch": 0.27, "percentage": 26.89, "elapsed_time": "11:23:18", "remaining_time": "1 day, 6:58:09"} +{"current_steps": 1909, "total_steps": 7063, "loss": 0.0038, "reward": -0.3747, "learning_rate": 1.5868081438363213e-07, "epoch": 0.27, "percentage": 27.03, "elapsed_time": "11:26:55", "remaining_time": "1 day, 6:54:34"} +{"current_steps": 1919, "total_steps": 7063, "loss": 0.0052, "reward": -0.2461, "learning_rate": 1.8167610196742125e-07, "epoch": 0.27, "percentage": 27.17, "elapsed_time": "11:30:27", "remaining_time": "1 day, 6:50:50"} +{"current_steps": 1929, "total_steps": 7063, "loss": 0.0044, "reward": -0.2565, "learning_rate": 2.0619615444661012e-07, "epoch": 0.27, "percentage": 27.31, "elapsed_time": "11:34:02", "remaining_time": "1 day, 6:47:11"} +{"current_steps": 1939, "total_steps": 7063, "loss": 0.0045, "reward": -0.4397, "learning_rate": 2.3223321241854335e-07, "epoch": 0.27, "percentage": 27.45, "elapsed_time": "11:37:39", "remaining_time": "1 day, 6:43:38"} +{"current_steps": 1949, "total_steps": 7063, "loss": 0.0047, "reward": -0.2828, "learning_rate": 2.5977903642219305e-07, "epoch": 0.28, "percentage": 27.59, "elapsed_time": "11:41:14", "remaining_time": "1 day, 6:39:58"} +{"current_steps": 1959, "total_steps": 7063, "loss": 0.0049, "reward": -0.361, "learning_rate": 2.8882490954554976e-07, "epoch": 0.28, "percentage": 27.74, "elapsed_time": "11:44:52", "remaining_time": "1 day, 6:36:30"} +{"current_steps": 1969, "total_steps": 7063, "loss": 0.0054, "reward": -0.2941, "learning_rate": 3.193616401840971e-07, "epoch": 0.28, "percentage": 27.88, "elapsed_time": "11:48:22", "remaining_time": "1 day, 6:32:37"} +{"current_steps": 1979, "total_steps": 7063, "loss": 0.0046, "reward": -0.3027, "learning_rate": 3.513795649495133e-07, "epoch": 0.28, "percentage": 28.02, "elapsed_time": "11:51:55", "remaining_time": "1 day, 6:28:55"} +{"current_steps": 1989, "total_steps": 7063, "loss": 0.0037, "reward": -0.391, "learning_rate": 3.848685517276546e-07, "epoch": 0.28, "percentage": 28.16, "elapsed_time": "11:55:32", "remaining_time": "1 day, 6:25:23"} +{"current_steps": 1999, "total_steps": 7063, "loss": 0.0048, "reward": -0.3608, "learning_rate": 4.1981800288488416e-07, "epoch": 0.28, "percentage": 28.3, "elapsed_time": "11:59:25", "remaining_time": "1 day, 6:22:29"} +{"current_steps": 2009, "total_steps": 7063, "loss": 0.0044, "reward": -0.3958, "learning_rate": 4.562168586217008e-07, "epoch": 0.28, "percentage": 28.44, "elapsed_time": "12:03:17", "remaining_time": "1 day, 6:19:33"} +{"current_steps": 2019, "total_steps": 7063, "loss": 0.0072, "reward": -0.5123, "learning_rate": 4.940536004726337e-07, "epoch": 0.29, "percentage": 28.59, "elapsed_time": "12:06:58", "remaining_time": "1 day, 6:16:10"} +{"current_steps": 2029, "total_steps": 7063, "loss": 0.0044, "reward": -0.2958, "learning_rate": 5.33316254951266e-07, "epoch": 0.29, "percentage": 28.73, "elapsed_time": "12:10:57", "remaining_time": "1 day, 6:13:32"} +{"current_steps": 2039, "total_steps": 7063, "loss": 0.0047, "reward": -0.4311, "learning_rate": 5.739923973392685e-07, "epoch": 0.29, "percentage": 28.87, "elapsed_time": "12:14:32", "remaining_time": "1 day, 6:09:53"} +{"current_steps": 2049, "total_steps": 7063, "loss": 0.0039, "reward": -0.4388, "learning_rate": 6.160691556182191e-07, "epoch": 0.29, "percentage": 29.01, "elapsed_time": "12:18:08", "remaining_time": "1 day, 6:06:16"} +{"current_steps": 2059, "total_steps": 7063, "loss": 0.0066, "reward": -0.4963, "learning_rate": 6.595332145429611e-07, "epoch": 0.29, "percentage": 29.15, "elapsed_time": "12:21:35", "remaining_time": "1 day, 6:02:18"} +{"current_steps": 2069, "total_steps": 7063, "loss": 0.0051, "reward": -0.3088, "learning_rate": 7.043708198552385e-07, "epoch": 0.29, "percentage": 29.29, "elapsed_time": "12:25:06", "remaining_time": "1 day, 5:58:29"} +{"current_steps": 2079, "total_steps": 7063, "loss": 0.0054, "reward": -0.3397, "learning_rate": 7.505677826362434e-07, "epoch": 0.29, "percentage": 29.44, "elapsed_time": "12:28:49", "remaining_time": "1 day, 5:55:08"} +{"current_steps": 2089, "total_steps": 7063, "loss": 0.0044, "reward": -0.4052, "learning_rate": 7.981094837967229e-07, "epoch": 0.3, "percentage": 29.58, "elapsed_time": "12:32:26", "remaining_time": "1 day, 5:51:35"} +{"current_steps": 2099, "total_steps": 7063, "loss": 0.0049, "reward": -0.3994, "learning_rate": 8.46980878703203e-07, "epoch": 0.3, "percentage": 29.72, "elapsed_time": "12:36:01", "remaining_time": "1 day, 5:47:56"} +{"current_steps": 2109, "total_steps": 7063, "loss": 0.0051, "reward": -0.4254, "learning_rate": 8.971665019388887e-07, "epoch": 0.3, "percentage": 29.86, "elapsed_time": "12:39:30", "remaining_time": "1 day, 5:44:04"} +{"current_steps": 2119, "total_steps": 7063, "loss": 0.0043, "reward": -0.3374, "learning_rate": 9.486504721977097e-07, "epoch": 0.3, "percentage": 30.0, "elapsed_time": "12:43:01", "remaining_time": "1 day, 5:40:15"} +{"current_steps": 2129, "total_steps": 7063, "loss": 0.0058, "reward": -0.3854, "learning_rate": 1.0014164973099866e-06, "epoch": 0.3, "percentage": 30.14, "elapsed_time": "12:46:29", "remaining_time": "1 day, 5:36:20"} +{"current_steps": 2139, "total_steps": 7063, "loss": 0.0043, "reward": -0.3606, "learning_rate": 1.0554478793981015e-06, "epoch": 0.3, "percentage": 30.28, "elapsed_time": "12:50:02", "remaining_time": "1 day, 5:32:38"} +{"current_steps": 2149, "total_steps": 7063, "loss": 0.0041, "reward": -0.3453, "learning_rate": 1.1107275201605728e-06, "epoch": 0.3, "percentage": 30.43, "elapsed_time": "12:53:35", "remaining_time": "1 day, 5:28:56"} +{"current_steps": 2159, "total_steps": 7063, "loss": 0.008, "reward": -0.3853, "learning_rate": 1.1672379262828238e-06, "epoch": 0.31, "percentage": 30.57, "elapsed_time": "12:57:14", "remaining_time": "1 day, 5:25:26"} +{"current_steps": 2169, "total_steps": 7063, "loss": 0.0052, "reward": -0.3406, "learning_rate": 1.2249612149729779e-06, "epoch": 0.31, "percentage": 30.71, "elapsed_time": "13:00:57", "remaining_time": "1 day, 5:22:06"} +{"current_steps": 2179, "total_steps": 7063, "loss": 0.0043, "reward": -0.3696, "learning_rate": 1.2838791196208771e-06, "epoch": 0.31, "percentage": 30.85, "elapsed_time": "13:04:38", "remaining_time": "1 day, 5:18:41"} +{"current_steps": 2189, "total_steps": 7063, "loss": 0.0048, "reward": -0.326, "learning_rate": 1.3439729955785901e-06, "epoch": 0.31, "percentage": 30.99, "elapsed_time": "13:08:16", "remaining_time": "1 day, 5:15:09"} +{"current_steps": 2199, "total_steps": 7063, "loss": 0.0048, "reward": -0.3875, "learning_rate": 1.40522382606052e-06, "epoch": 0.31, "percentage": 31.13, "elapsed_time": "13:12:03", "remaining_time": "1 day, 5:11:57"} +{"current_steps": 2209, "total_steps": 7063, "loss": 0.0044, "reward": -0.3224, "learning_rate": 1.4676122281613041e-06, "epoch": 0.31, "percentage": 31.28, "elapsed_time": "13:15:39", "remaining_time": "1 day, 5:08:20"} +{"current_steps": 2219, "total_steps": 7063, "loss": 0.0054, "reward": -0.4125, "learning_rate": 1.5311184589895495e-06, "epoch": 0.31, "percentage": 31.42, "elapsed_time": "13:19:12", "remaining_time": "1 day, 5:04:38"} +{"current_steps": 2229, "total_steps": 7063, "loss": 0.0051, "reward": -0.5115, "learning_rate": 1.595722421915507e-06, "epoch": 0.32, "percentage": 31.56, "elapsed_time": "13:22:55", "remaining_time": "1 day, 5:01:16"} +{"current_steps": 2239, "total_steps": 7063, "loss": 0.0042, "reward": -0.5107, "learning_rate": 1.6614036729306638e-06, "epoch": 0.32, "percentage": 31.7, "elapsed_time": "13:26:34", "remaining_time": "1 day, 4:57:48"} +{"current_steps": 2249, "total_steps": 7063, "loss": 0.0048, "reward": -0.4813, "learning_rate": 1.7281414271172925e-06, "epoch": 0.32, "percentage": 31.84, "elapsed_time": "13:30:10", "remaining_time": "1 day, 4:54:12"} +{"current_steps": 2259, "total_steps": 7063, "loss": 0.0036, "reward": -0.2592, "learning_rate": 1.7959145652258408e-06, "epoch": 0.32, "percentage": 31.98, "elapsed_time": "13:33:58", "remaining_time": "1 day, 4:51:00"} +{"current_steps": 2269, "total_steps": 7063, "loss": 0.0045, "reward": -0.431, "learning_rate": 1.8647016403581763e-06, "epoch": 0.32, "percentage": 32.13, "elapsed_time": "13:37:31", "remaining_time": "1 day, 4:47:16"} +{"current_steps": 2279, "total_steps": 7063, "loss": 0.0045, "reward": -0.3041, "learning_rate": 1.9344808847544632e-06, "epoch": 0.32, "percentage": 32.27, "elapsed_time": "13:41:09", "remaining_time": "1 day, 4:43:44"} +{"current_steps": 2289, "total_steps": 7063, "loss": 0.0054, "reward": -0.2746, "learning_rate": 2.0052302166816017e-06, "epoch": 0.32, "percentage": 32.41, "elapsed_time": "13:44:45", "remaining_time": "1 day, 4:40:08"} +{"current_steps": 2299, "total_steps": 7063, "loss": 0.0059, "reward": -0.5107, "learning_rate": 2.0769272474210374e-06, "epoch": 0.33, "percentage": 32.55, "elapsed_time": "13:48:25", "remaining_time": "1 day, 4:36:40"} +{"current_steps": 2309, "total_steps": 7063, "loss": 0.0044, "reward": -0.3638, "learning_rate": 2.149549288353676e-06, "epoch": 0.33, "percentage": 32.69, "elapsed_time": "13:51:55", "remaining_time": "1 day, 4:32:51"} +{"current_steps": 2319, "total_steps": 7063, "loss": 0.0055, "reward": -0.3426, "learning_rate": 2.2230733581397427e-06, "epoch": 0.33, "percentage": 32.83, "elapsed_time": "13:55:26", "remaining_time": "1 day, 4:29:03"} +{"current_steps": 2329, "total_steps": 7063, "loss": 0.0048, "reward": -0.3561, "learning_rate": 2.297476189991249e-06, "epoch": 0.33, "percentage": 32.97, "elapsed_time": "13:59:02", "remaining_time": "1 day, 4:25:27"} +{"current_steps": 2339, "total_steps": 7063, "loss": 0.0058, "reward": -0.334, "learning_rate": 2.3727342390348134e-06, "epoch": 0.33, "percentage": 33.12, "elapsed_time": "14:02:38", "remaining_time": "1 day, 4:21:50"} +{"current_steps": 2349, "total_steps": 7063, "loss": 0.0043, "reward": -0.188, "learning_rate": 2.4488236897624457e-06, "epoch": 0.33, "percentage": 33.26, "elapsed_time": "14:06:02", "remaining_time": "1 day, 4:17:49"} +{"current_steps": 2359, "total_steps": 7063, "loss": 0.005, "reward": -0.3464, "learning_rate": 2.525720463568009e-06, "epoch": 0.33, "percentage": 33.4, "elapsed_time": "14:09:42", "remaining_time": "1 day, 4:14:23"} +{"current_steps": 2369, "total_steps": 7063, "loss": 0.0041, "reward": -0.4215, "learning_rate": 2.603400226366919e-06, "epoch": 0.34, "percentage": 33.54, "elapsed_time": "14:13:33", "remaining_time": "1 day, 4:11:15"} +{"current_steps": 2379, "total_steps": 7063, "loss": 0.0059, "reward": -0.483, "learning_rate": 2.6818383962967134e-06, "epoch": 0.34, "percentage": 33.68, "elapsed_time": "14:17:07", "remaining_time": "1 day, 4:07:34"} +{"current_steps": 2389, "total_steps": 7063, "loss": 0.0042, "reward": -0.3055, "learning_rate": 2.7610101514959903e-06, "epoch": 0.34, "percentage": 33.82, "elapsed_time": "14:20:37", "remaining_time": "1 day, 4:03:46"} +{"current_steps": 2399, "total_steps": 7063, "loss": 0.0047, "reward": -0.2254, "learning_rate": 2.840890437959334e-06, "epoch": 0.34, "percentage": 33.97, "elapsed_time": "14:24:10", "remaining_time": "1 day, 4:00:03"} +{"current_steps": 2409, "total_steps": 7063, "loss": 0.0049, "reward": -0.4363, "learning_rate": 2.92145397746568e-06, "epoch": 0.34, "percentage": 34.11, "elapsed_time": "14:27:38", "remaining_time": "1 day, 3:56:12"} +{"current_steps": 2419, "total_steps": 7063, "loss": 0.0053, "reward": -0.4156, "learning_rate": 3.002675275577659e-06, "epoch": 0.34, "percentage": 34.25, "elapsed_time": "14:31:20", "remaining_time": "1 day, 3:52:48"} +{"current_steps": 2429, "total_steps": 7063, "loss": 0.0032, "reward": -0.3561, "learning_rate": 3.0845286297093167e-06, "epoch": 0.34, "percentage": 34.39, "elapsed_time": "14:35:04", "remaining_time": "1 day, 3:49:27"} +{"current_steps": 2439, "total_steps": 7063, "loss": 0.0039, "reward": -0.4369, "learning_rate": 3.166988137259751e-06, "epoch": 0.35, "percentage": 34.53, "elapsed_time": "14:38:42", "remaining_time": "1 day, 3:45:54"} +{"current_steps": 2449, "total_steps": 7063, "loss": 0.0049, "reward": -0.431, "learning_rate": 3.2500277038100126e-06, "epoch": 0.35, "percentage": 34.67, "elapsed_time": "14:42:22", "remaining_time": "1 day, 3:42:26"} +{"current_steps": 2459, "total_steps": 7063, "loss": 0.0047, "reward": -0.4215, "learning_rate": 3.3336210513807366e-06, "epoch": 0.35, "percentage": 34.82, "elapsed_time": "14:46:01", "remaining_time": "1 day, 3:38:53"} +{"current_steps": 2469, "total_steps": 7063, "loss": 0.0044, "reward": -0.2004, "learning_rate": 3.4177417267478236e-06, "epoch": 0.35, "percentage": 34.96, "elapsed_time": "14:49:33", "remaining_time": "1 day, 3:35:10"} +{"current_steps": 2479, "total_steps": 7063, "loss": 0.0039, "reward": -0.3595, "learning_rate": 3.502363109813589e-06, "epoch": 0.35, "percentage": 35.1, "elapsed_time": "14:53:07", "remaining_time": "1 day, 3:31:31"} +{"current_steps": 2489, "total_steps": 7063, "loss": 0.0052, "reward": -0.3384, "learning_rate": 3.5874584220307686e-06, "epoch": 0.35, "percentage": 35.24, "elapsed_time": "14:56:50", "remaining_time": "1 day, 3:28:06"} +{"current_steps": 2499, "total_steps": 7063, "loss": 0.0042, "reward": -0.1973, "learning_rate": 3.673000734876582e-06, "epoch": 0.35, "percentage": 35.38, "elapsed_time": "15:00:24", "remaining_time": "1 day, 3:24:27"} +{"current_steps": 2509, "total_steps": 7063, "loss": 0.0044, "reward": -0.4077, "learning_rate": 3.7589629783743188e-06, "epoch": 0.36, "percentage": 35.52, "elapsed_time": "15:04:01", "remaining_time": "1 day, 3:20:52"} +{"current_steps": 2519, "total_steps": 7063, "loss": 0.0046, "reward": -0.5238, "learning_rate": 3.845317949659662e-06, "epoch": 0.36, "percentage": 35.66, "elapsed_time": "15:07:33", "remaining_time": "1 day, 3:17:07"} +{"current_steps": 2529, "total_steps": 7063, "loss": 0.0039, "reward": -0.3569, "learning_rate": 3.932038321589086e-06, "epoch": 0.36, "percentage": 35.81, "elapsed_time": "15:11:09", "remaining_time": "1 day, 3:13:32"} +{"current_steps": 2539, "total_steps": 7063, "loss": 0.005, "reward": -0.4477, "learning_rate": 4.01909665138754e-06, "epoch": 0.36, "percentage": 35.95, "elapsed_time": "15:14:38", "remaining_time": "1 day, 3:09:42"} +{"current_steps": 2549, "total_steps": 7063, "loss": 0.0035, "reward": -0.303, "learning_rate": 4.106465389332768e-06, "epoch": 0.36, "percentage": 36.09, "elapsed_time": "15:18:13", "remaining_time": "1 day, 3:06:03"} +{"current_steps": 2559, "total_steps": 7063, "loss": 0.0042, "reward": -0.3804, "learning_rate": 4.194116887473445e-06, "epoch": 0.36, "percentage": 36.23, "elapsed_time": "15:21:51", "remaining_time": "1 day, 3:02:31"} +{"current_steps": 2569, "total_steps": 7063, "loss": 0.0047, "reward": -0.4259, "learning_rate": 4.282023408378429e-06, "epoch": 0.36, "percentage": 36.37, "elapsed_time": "15:25:33", "remaining_time": "1 day, 2:59:05"} +{"current_steps": 2579, "total_steps": 7063, "loss": 0.0049, "reward": -0.3371, "learning_rate": 4.370157133914274e-06, "epoch": 0.37, "percentage": 36.51, "elapsed_time": "15:29:06", "remaining_time": "1 day, 2:55:23"} +{"current_steps": 2589, "total_steps": 7063, "loss": 0.0047, "reward": -0.4291, "learning_rate": 4.458490174048339e-06, "epoch": 0.37, "percentage": 36.66, "elapsed_time": "15:32:43", "remaining_time": "1 day, 2:51:48"} +{"current_steps": 2599, "total_steps": 7063, "loss": 0.0044, "reward": -0.4106, "learning_rate": 4.5469945756746145e-06, "epoch": 0.37, "percentage": 36.8, "elapsed_time": "15:36:21", "remaining_time": "1 day, 2:48:17"} +{"current_steps": 2609, "total_steps": 7063, "loss": 0.0036, "reward": -0.3657, "learning_rate": 4.635642331459522e-06, "epoch": 0.37, "percentage": 36.94, "elapsed_time": "15:39:53", "remaining_time": "1 day, 2:44:32"} +{"current_steps": 2619, "total_steps": 7063, "loss": 0.0052, "reward": -0.3857, "learning_rate": 4.724405388704883e-06, "epoch": 0.37, "percentage": 37.08, "elapsed_time": "15:43:28", "remaining_time": "1 day, 2:40:55"} +{"current_steps": 2629, "total_steps": 7063, "loss": 0.0047, "reward": -0.3853, "learning_rate": 4.804367507873278e-06, "epoch": 0.37, "percentage": 37.22, "elapsed_time": "15:47:00", "remaining_time": "1 day, 2:37:11"} +{"current_steps": 2639, "total_steps": 7063, "loss": 0.0054, "reward": -0.3366, "learning_rate": 4.893272229193558e-06, "epoch": 0.37, "percentage": 37.36, "elapsed_time": "15:50:35", "remaining_time": "1 day, 2:33:34"} +{"current_steps": 2649, "total_steps": 7063, "loss": 0.005, "reward": -0.4375, "learning_rate": 4.982210724656406e-06, "epoch": 0.38, "percentage": 37.51, "elapsed_time": "15:54:07", "remaining_time": "1 day, 2:29:50"} +{"current_steps": 2659, "total_steps": 7063, "loss": 0.0043, "reward": -0.3342, "learning_rate": 5.071154849558693e-06, "epoch": 0.38, "percentage": 37.65, "elapsed_time": "15:57:41", "remaining_time": "1 day, 2:26:12"} +{"current_steps": 2669, "total_steps": 7063, "loss": 0.0047, "reward": -0.4507, "learning_rate": 5.160076457415833e-06, "epoch": 0.38, "percentage": 37.79, "elapsed_time": "16:01:19", "remaining_time": "1 day, 2:22:37"} +{"current_steps": 2679, "total_steps": 7063, "loss": 0.005, "reward": -0.4391, "learning_rate": 5.248947408868792e-06, "epoch": 0.38, "percentage": 37.93, "elapsed_time": "16:04:52", "remaining_time": "1 day, 2:18:57"} +{"current_steps": 2689, "total_steps": 7063, "loss": 0.0036, "reward": -0.2586, "learning_rate": 5.33773958058882e-06, "epoch": 0.38, "percentage": 38.07, "elapsed_time": "16:08:30", "remaining_time": "1 day, 2:15:24"} +{"current_steps": 2699, "total_steps": 7063, "loss": 0.0044, "reward": -0.4199, "learning_rate": 5.426424874177126e-06, "epoch": 0.38, "percentage": 38.21, "elapsed_time": "16:12:06", "remaining_time": "1 day, 2:11:47"} +{"current_steps": 2709, "total_steps": 7063, "loss": 0.0044, "reward": -0.4119, "learning_rate": 5.514975225056634e-06, "epoch": 0.38, "percentage": 38.35, "elapsed_time": "16:15:50", "remaining_time": "1 day, 2:08:24"} +{"current_steps": 2719, "total_steps": 7063, "loss": 0.0043, "reward": -0.3747, "learning_rate": 5.603362611353067e-06, "epoch": 0.38, "percentage": 38.5, "elapsed_time": "16:19:25", "remaining_time": "1 day, 2:04:46"} +{"current_steps": 2729, "total_steps": 7063, "loss": 0.0051, "reward": -0.2529, "learning_rate": 5.691559062762498e-06, "epoch": 0.39, "percentage": 38.64, "elapsed_time": "16:23:03", "remaining_time": "1 day, 2:01:13"} +{"current_steps": 2739, "total_steps": 7063, "loss": 0.0038, "reward": -0.3863, "learning_rate": 5.779536669402608e-06, "epoch": 0.39, "percentage": 38.78, "elapsed_time": "16:26:45", "remaining_time": "1 day, 1:57:46"} +{"current_steps": 2749, "total_steps": 7063, "loss": 0.0043, "reward": -0.4039, "learning_rate": 5.867267590644781e-06, "epoch": 0.39, "percentage": 38.92, "elapsed_time": "16:30:22", "remaining_time": "1 day, 1:54:10"} +{"current_steps": 2759, "total_steps": 7063, "loss": 0.0041, "reward": -0.3328, "learning_rate": 5.954724063924317e-06, "epoch": 0.39, "percentage": 39.06, "elapsed_time": "16:34:06", "remaining_time": "1 day, 1:50:47"} +{"current_steps": 2769, "total_steps": 7063, "loss": 0.0044, "reward": -0.2204, "learning_rate": 6.041878413525932e-06, "epoch": 0.39, "percentage": 39.2, "elapsed_time": "16:37:44", "remaining_time": "1 day, 1:47:14"} +{"current_steps": 2779, "total_steps": 7063, "loss": 0.0056, "reward": -0.4904, "learning_rate": 6.128703059341788e-06, "epoch": 0.39, "percentage": 39.35, "elapsed_time": "16:41:27", "remaining_time": "1 day, 1:43:49"} +{"current_steps": 2789, "total_steps": 7063, "loss": 0.0047, "reward": -0.3944, "learning_rate": 6.215170525599225e-06, "epoch": 0.39, "percentage": 39.49, "elapsed_time": "16:45:00", "remaining_time": "1 day, 1:40:07"} +{"current_steps": 2799, "total_steps": 7063, "loss": 0.0053, "reward": -0.5206, "learning_rate": 6.3012534495555275e-06, "epoch": 0.4, "percentage": 39.63, "elapsed_time": "16:48:30", "remaining_time": "1 day, 1:36:21"} +{"current_steps": 2809, "total_steps": 7063, "loss": 0.0033, "reward": -0.1779, "learning_rate": 6.386924590156891e-06, "epoch": 0.4, "percentage": 39.77, "elapsed_time": "16:52:10", "remaining_time": "1 day, 1:32:51"} +{"current_steps": 2819, "total_steps": 7063, "loss": 0.0045, "reward": -0.4464, "learning_rate": 6.4721568366589e-06, "epoch": 0.4, "percentage": 39.91, "elapsed_time": "16:55:36", "remaining_time": "1 day, 1:29:00"} +{"current_steps": 2829, "total_steps": 7063, "loss": 0.0036, "reward": -0.3361, "learning_rate": 6.556923217205744e-06, "epoch": 0.4, "percentage": 40.05, "elapsed_time": "16:59:11", "remaining_time": "1 day, 1:25:21"} +{"current_steps": 2839, "total_steps": 7063, "loss": 0.0049, "reward": -0.5177, "learning_rate": 6.641196907365499e-06, "epoch": 0.4, "percentage": 40.2, "elapsed_time": "17:02:45", "remaining_time": "1 day, 1:21:42"} +{"current_steps": 2849, "total_steps": 7063, "loss": 0.0048, "reward": -0.4074, "learning_rate": 6.724951238618763e-06, "epoch": 0.4, "percentage": 40.34, "elapsed_time": "17:06:16", "remaining_time": "1 day, 1:17:58"} +{"current_steps": 2859, "total_steps": 7063, "loss": 0.0047, "reward": -0.2954, "learning_rate": 6.808159706797949e-06, "epoch": 0.4, "percentage": 40.48, "elapsed_time": "17:09:43", "remaining_time": "1 day, 1:14:09"} +{"current_steps": 2869, "total_steps": 7063, "loss": 0.0046, "reward": -0.312, "learning_rate": 6.8907959804745294e-06, "epoch": 0.41, "percentage": 40.62, "elapsed_time": "17:13:33", "remaining_time": "1 day, 1:10:53"} +{"current_steps": 2879, "total_steps": 7063, "loss": 0.0053, "reward": -0.4417, "learning_rate": 6.972833909291694e-06, "epoch": 0.41, "percentage": 40.76, "elapsed_time": "17:17:10", "remaining_time": "1 day, 1:07:19"} +{"current_steps": 2889, "total_steps": 7063, "loss": 0.0036, "reward": -0.2909, "learning_rate": 7.054247532239634e-06, "epoch": 0.41, "percentage": 40.9, "elapsed_time": "17:20:56", "remaining_time": "1 day, 1:03:55"} +{"current_steps": 2899, "total_steps": 7063, "loss": 0.0044, "reward": -0.2276, "learning_rate": 7.135011085870964e-06, "epoch": 0.41, "percentage": 41.04, "elapsed_time": "17:24:26", "remaining_time": "1 day, 1:00:12"} +{"current_steps": 2909, "total_steps": 7063, "loss": 0.0049, "reward": -0.3637, "learning_rate": 7.21509901245357e-06, "epoch": 0.41, "percentage": 41.19, "elapsed_time": "17:28:03", "remaining_time": "1 day, 0:56:36"} +{"current_steps": 2919, "total_steps": 7063, "loss": 0.0067, "reward": -0.3676, "learning_rate": 7.294485968058404e-06, "epoch": 0.41, "percentage": 41.33, "elapsed_time": "17:31:41", "remaining_time": "1 day, 0:53:02"} +{"current_steps": 2929, "total_steps": 7063, "loss": 0.0034, "reward": -0.1601, "learning_rate": 7.373146830579596e-06, "epoch": 0.41, "percentage": 41.47, "elapsed_time": "17:35:22", "remaining_time": "1 day, 0:49:32"} +{"current_steps": 2939, "total_steps": 7063, "loss": 0.0041, "reward": -0.1314, "learning_rate": 7.451056707684396e-06, "epoch": 0.42, "percentage": 41.61, "elapsed_time": "17:38:57", "remaining_time": "1 day, 0:45:56"} +{"current_steps": 2949, "total_steps": 7063, "loss": 0.0035, "reward": -0.2391, "learning_rate": 7.528190944690356e-06, "epoch": 0.42, "percentage": 41.75, "elapsed_time": "17:42:38", "remaining_time": "1 day, 0:42:26"} +{"current_steps": 2959, "total_steps": 7063, "loss": 0.0052, "reward": -0.4042, "learning_rate": 7.6045251323673555e-06, "epoch": 0.42, "percentage": 41.89, "elapsed_time": "17:46:01", "remaining_time": "1 day, 0:38:31"} +{"current_steps": 2969, "total_steps": 7063, "loss": 0.0044, "reward": -0.3035, "learning_rate": 7.680035114661929e-06, "epoch": 0.42, "percentage": 42.04, "elapsed_time": "17:49:35", "remaining_time": "1 day, 0:34:51"} +{"current_steps": 2979, "total_steps": 7063, "loss": 0.0049, "reward": -0.3552, "learning_rate": 7.754696996341486e-06, "epoch": 0.42, "percentage": 42.18, "elapsed_time": "17:53:08", "remaining_time": "1 day, 0:31:11"} +{"current_steps": 2989, "total_steps": 7063, "loss": 0.0049, "reward": -0.2459, "learning_rate": 7.828487150555979e-06, "epoch": 0.42, "percentage": 42.32, "elapsed_time": "17:56:34", "remaining_time": "1 day, 0:27:22"} +{"current_steps": 2999, "total_steps": 7063, "loss": 0.0036, "reward": -0.2989, "learning_rate": 7.901382226314662e-06, "epoch": 0.42, "percentage": 42.46, "elapsed_time": "18:00:17", "remaining_time": "1 day, 0:23:54"} +{"current_steps": 3009, "total_steps": 7063, "loss": 0.0057, "reward": -0.5494, "learning_rate": 7.973359155875521e-06, "epoch": 0.43, "percentage": 42.6, "elapsed_time": "18:03:55", "remaining_time": "1 day, 0:20:21"} +{"current_steps": 3019, "total_steps": 7063, "loss": 0.0045, "reward": -0.3344, "learning_rate": 8.044395162045135e-06, "epoch": 0.43, "percentage": 42.74, "elapsed_time": "18:07:31", "remaining_time": "1 day, 0:16:44"} +{"current_steps": 3029, "total_steps": 7063, "loss": 0.0045, "reward": -0.3949, "learning_rate": 8.11446776538649e-06, "epoch": 0.43, "percentage": 42.89, "elapsed_time": "18:11:00", "remaining_time": "1 day, 0:13:00"} +{"current_steps": 3039, "total_steps": 7063, "loss": 0.004, "reward": -0.2997, "learning_rate": 8.183554791332675e-06, "epoch": 0.43, "percentage": 43.03, "elapsed_time": "18:14:38", "remaining_time": "1 day, 0:09:26"} +{"current_steps": 3049, "total_steps": 7063, "loss": 0.0034, "reward": -0.2654, "learning_rate": 8.251634377204023e-06, "epoch": 0.43, "percentage": 43.17, "elapsed_time": "18:18:13", "remaining_time": "1 day, 0:05:48"} +{"current_steps": 3059, "total_steps": 7063, "loss": 0.0034, "reward": -0.4013, "learning_rate": 8.318684979126607e-06, "epoch": 0.43, "percentage": 43.31, "elapsed_time": "18:21:54", "remaining_time": "1 day, 0:02:19"} +{"current_steps": 3069, "total_steps": 7063, "loss": 0.0035, "reward": -0.4777, "learning_rate": 8.384685378849804e-06, "epoch": 0.43, "percentage": 43.45, "elapsed_time": "18:25:35", "remaining_time": "23:58:49"} +{"current_steps": 3079, "total_steps": 7063, "loss": 0.0031, "reward": -0.3525, "learning_rate": 8.44961469046086e-06, "epoch": 0.44, "percentage": 43.59, "elapsed_time": "18:29:20", "remaining_time": "23:55:24"} +{"current_steps": 3089, "total_steps": 7063, "loss": 0.0042, "reward": -0.1987, "learning_rate": 8.513452366994242e-06, "epoch": 0.44, "percentage": 43.73, "elapsed_time": "18:32:47", "remaining_time": "23:51:36"} +{"current_steps": 3099, "total_steps": 7063, "loss": 0.0043, "reward": -0.439, "learning_rate": 8.576178206933773e-06, "epoch": 0.44, "percentage": 43.88, "elapsed_time": "18:36:23", "remaining_time": "23:47:59"} +{"current_steps": 3109, "total_steps": 7063, "loss": 0.0048, "reward": -0.2539, "learning_rate": 8.637772360605421e-06, "epoch": 0.44, "percentage": 44.02, "elapsed_time": "18:39:54", "remaining_time": "23:44:17"} +{"current_steps": 3119, "total_steps": 7063, "loss": 0.0047, "reward": -0.4092, "learning_rate": 8.698215336458743e-06, "epoch": 0.44, "percentage": 44.16, "elapsed_time": "18:43:24", "remaining_time": "23:40:33"} +{"current_steps": 3129, "total_steps": 7063, "loss": 0.0042, "reward": -0.288, "learning_rate": 8.757488007235031e-06, "epoch": 0.44, "percentage": 44.3, "elapsed_time": "18:47:22", "remaining_time": "23:37:25"} +{"current_steps": 3139, "total_steps": 7063, "loss": 0.0033, "reward": -0.2841, "learning_rate": 8.815571616020147e-06, "epoch": 0.44, "percentage": 44.44, "elapsed_time": "18:50:58", "remaining_time": "23:33:48"} +{"current_steps": 3149, "total_steps": 7063, "loss": 0.0044, "reward": -0.3696, "learning_rate": 8.872447782180168e-06, "epoch": 0.45, "percentage": 44.58, "elapsed_time": "18:54:40", "remaining_time": "23:30:19"} +{"current_steps": 3159, "total_steps": 7063, "loss": 0.0034, "reward": -0.1236, "learning_rate": 8.92809850717797e-06, "epoch": 0.45, "percentage": 44.73, "elapsed_time": "18:58:18", "remaining_time": "23:26:46"} +{"current_steps": 3169, "total_steps": 7063, "loss": 0.0041, "reward": -0.269, "learning_rate": 8.982506180268895e-06, "epoch": 0.45, "percentage": 44.87, "elapsed_time": "19:02:04", "remaining_time": "23:23:20"} +{"current_steps": 3179, "total_steps": 7063, "loss": 0.0029, "reward": -0.4326, "learning_rate": 9.035653584073673e-06, "epoch": 0.45, "percentage": 45.01, "elapsed_time": "19:05:51", "remaining_time": "23:19:58"} +{"current_steps": 3189, "total_steps": 7063, "loss": 0.0038, "reward": -0.2885, "learning_rate": 9.087523900026907e-06, "epoch": 0.45, "percentage": 45.15, "elapsed_time": "19:09:24", "remaining_time": "23:16:18"} +{"current_steps": 3199, "total_steps": 7063, "loss": 0.0038, "reward": -0.3119, "learning_rate": 9.138100713699312e-06, "epoch": 0.45, "percentage": 45.29, "elapsed_time": "19:13:03", "remaining_time": "23:12:45"} +{"current_steps": 3209, "total_steps": 7063, "loss": 0.004, "reward": -0.196, "learning_rate": 9.187368019992092e-06, "epoch": 0.45, "percentage": 45.43, "elapsed_time": "19:16:29", "remaining_time": "23:08:56"} +{"current_steps": 3219, "total_steps": 7063, "loss": 0.0036, "reward": -0.3683, "learning_rate": 9.235310228201782e-06, "epoch": 0.46, "percentage": 45.58, "elapsed_time": "19:20:05", "remaining_time": "23:05:19"} +{"current_steps": 3229, "total_steps": 7063, "loss": 0.0035, "reward": -0.1997, "learning_rate": 9.281912166953929e-06, "epoch": 0.46, "percentage": 45.72, "elapsed_time": "19:23:47", "remaining_time": "23:01:51"} +{"current_steps": 3239, "total_steps": 7063, "loss": 0.0042, "reward": -0.403, "learning_rate": 9.327159089004098e-06, "epoch": 0.46, "percentage": 45.86, "elapsed_time": "19:27:19", "remaining_time": "22:58:09"} +{"current_steps": 3249, "total_steps": 7063, "loss": 0.0034, "reward": -0.3637, "learning_rate": 9.371036675904667e-06, "epoch": 0.46, "percentage": 46.0, "elapsed_time": "19:30:52", "remaining_time": "22:54:29"} +{"current_steps": 3259, "total_steps": 7063, "loss": 0.0049, "reward": -0.3766, "learning_rate": 9.413531042535915e-06, "epoch": 0.46, "percentage": 46.14, "elapsed_time": "19:34:25", "remaining_time": "22:50:48"} +{"current_steps": 3269, "total_steps": 7063, "loss": 0.0044, "reward": -0.3386, "learning_rate": 9.454628741499976e-06, "epoch": 0.46, "percentage": 46.28, "elapsed_time": "19:37:53", "remaining_time": "22:47:03"} +{"current_steps": 3279, "total_steps": 7063, "loss": 0.0039, "reward": -0.3232, "learning_rate": 9.494316767376295e-06, "epoch": 0.46, "percentage": 46.43, "elapsed_time": "19:41:27", "remaining_time": "22:43:24"} +{"current_steps": 3289, "total_steps": 7063, "loss": 0.0032, "reward": -0.3225, "learning_rate": 9.532582560837204e-06, "epoch": 0.47, "percentage": 46.57, "elapsed_time": "19:45:05", "remaining_time": "22:39:50"} +{"current_steps": 3299, "total_steps": 7063, "loss": 0.0037, "reward": -0.3366, "learning_rate": 9.569414012622356e-06, "epoch": 0.47, "percentage": 46.71, "elapsed_time": "19:48:41", "remaining_time": "22:36:14"} +{"current_steps": 3309, "total_steps": 7063, "loss": 0.0038, "reward": -0.3283, "learning_rate": 9.604799467370689e-06, "epoch": 0.47, "percentage": 46.85, "elapsed_time": "19:52:12", "remaining_time": "22:32:32"} +{"current_steps": 3319, "total_steps": 7063, "loss": 0.0033, "reward": -0.2504, "learning_rate": 9.63872772730879e-06, "epoch": 0.47, "percentage": 46.99, "elapsed_time": "19:55:46", "remaining_time": "22:28:53"} +{"current_steps": 3329, "total_steps": 7063, "loss": 0.0037, "reward": -0.3496, "learning_rate": 9.671188055794462e-06, "epoch": 0.47, "percentage": 47.13, "elapsed_time": "19:59:21", "remaining_time": "22:25:16"} +{"current_steps": 3339, "total_steps": 7063, "loss": 0.0035, "reward": -0.3135, "learning_rate": 9.702170180714328e-06, "epoch": 0.47, "percentage": 47.27, "elapsed_time": "20:02:57", "remaining_time": "22:21:40"} +{"current_steps": 3349, "total_steps": 7063, "loss": 0.0036, "reward": -0.3951, "learning_rate": 9.731664297734458e-06, "epoch": 0.47, "percentage": 47.42, "elapsed_time": "20:06:33", "remaining_time": "22:18:03"} +{"current_steps": 3359, "total_steps": 7063, "loss": 0.0032, "reward": -0.4631, "learning_rate": 9.75966107340297e-06, "epoch": 0.48, "percentage": 47.56, "elapsed_time": "20:10:22", "remaining_time": "22:14:41"} +{"current_steps": 3369, "total_steps": 7063, "loss": 0.0036, "reward": -0.3141, "learning_rate": 9.786151648103613e-06, "epoch": 0.48, "percentage": 47.7, "elapsed_time": "20:14:10", "remaining_time": "22:11:18"} +{"current_steps": 3379, "total_steps": 7063, "loss": 0.003, "reward": -0.1992, "learning_rate": 9.811127638859398e-06, "epoch": 0.48, "percentage": 47.84, "elapsed_time": "20:17:47", "remaining_time": "22:07:42"} +{"current_steps": 3389, "total_steps": 7063, "loss": 0.0038, "reward": -0.3201, "learning_rate": 9.834581141985404e-06, "epoch": 0.48, "percentage": 47.98, "elapsed_time": "20:21:19", "remaining_time": "22:04:01"} +{"current_steps": 3399, "total_steps": 7063, "loss": 0.0031, "reward": -0.1577, "learning_rate": 9.85650473558991e-06, "epoch": 0.48, "percentage": 48.12, "elapsed_time": "20:24:49", "remaining_time": "22:00:18"} +{"current_steps": 3409, "total_steps": 7063, "loss": 0.0035, "reward": -0.2635, "learning_rate": 9.876891481923067e-06, "epoch": 0.48, "percentage": 48.27, "elapsed_time": "20:28:20", "remaining_time": "21:56:37"} +{"current_steps": 3419, "total_steps": 7063, "loss": 0.0044, "reward": -0.3539, "learning_rate": 9.89573492957235e-06, "epoch": 0.48, "percentage": 48.41, "elapsed_time": "20:32:02", "remaining_time": "21:53:06"} +{"current_steps": 3429, "total_steps": 7063, "loss": 0.0031, "reward": -0.3358, "learning_rate": 9.91302911550412e-06, "epoch": 0.49, "percentage": 48.55, "elapsed_time": "20:35:39", "remaining_time": "21:49:31"} +{"current_steps": 3439, "total_steps": 7063, "loss": 0.0041, "reward": -0.2885, "learning_rate": 9.928768566950632e-06, "epoch": 0.49, "percentage": 48.69, "elapsed_time": "20:39:15", "remaining_time": "21:45:55"} +{"current_steps": 3449, "total_steps": 7063, "loss": 0.0037, "reward": -0.2699, "learning_rate": 9.94294830314191e-06, "epoch": 0.49, "percentage": 48.83, "elapsed_time": "20:42:56", "remaining_time": "21:42:24"} +{"current_steps": 3459, "total_steps": 7063, "loss": 0.0053, "reward": -0.317, "learning_rate": 9.955563836881898e-06, "epoch": 0.49, "percentage": 48.97, "elapsed_time": "20:46:32", "remaining_time": "21:38:48"} +{"current_steps": 3469, "total_steps": 7063, "loss": 0.0035, "reward": -0.2824, "learning_rate": 9.966611175968454e-06, "epoch": 0.49, "percentage": 49.12, "elapsed_time": "20:50:14", "remaining_time": "21:35:17"} +{"current_steps": 3479, "total_steps": 7063, "loss": 0.004, "reward": -0.5046, "learning_rate": 9.976086824456686e-06, "epoch": 0.49, "percentage": 49.26, "elapsed_time": "20:53:51", "remaining_time": "21:31:41"} +{"current_steps": 3489, "total_steps": 7063, "loss": 0.0036, "reward": -0.4293, "learning_rate": 9.983987783765243e-06, "epoch": 0.49, "percentage": 49.4, "elapsed_time": "20:57:28", "remaining_time": "21:28:06"} +{"current_steps": 3499, "total_steps": 7063, "loss": 0.0034, "reward": -0.1845, "learning_rate": 9.990311553625227e-06, "epoch": 0.5, "percentage": 49.54, "elapsed_time": "21:00:57", "remaining_time": "21:24:23"} +{"current_steps": 3509, "total_steps": 7063, "loss": 0.0035, "reward": -0.1239, "learning_rate": 9.995056132871399e-06, "epoch": 0.5, "percentage": 49.68, "elapsed_time": "21:04:40", "remaining_time": "21:20:53"} +{"current_steps": 3519, "total_steps": 7063, "loss": 0.0031, "reward": -0.271, "learning_rate": 9.998220020075455e-06, "epoch": 0.5, "percentage": 49.82, "elapsed_time": "21:08:20", "remaining_time": "21:17:20"} +{"current_steps": 3529, "total_steps": 7063, "loss": 0.0039, "reward": -0.4751, "learning_rate": 9.999802214021156e-06, "epoch": 0.5, "percentage": 49.96, "elapsed_time": "21:11:50", "remaining_time": "21:13:38"} +{"current_steps": 3539, "total_steps": 7063, "loss": 0.0038, "reward": -0.454, "learning_rate": 9.999802214021156e-06, "epoch": 0.5, "percentage": 50.11, "elapsed_time": "21:15:28", "remaining_time": "21:10:04"} +{"current_steps": 3549, "total_steps": 7063, "loss": 0.0041, "reward": -0.1722, "learning_rate": 9.998220020075455e-06, "epoch": 0.5, "percentage": 50.25, "elapsed_time": "21:19:02", "remaining_time": "21:06:25"} +{"current_steps": 3559, "total_steps": 7063, "loss": 0.0041, "reward": -0.2842, "learning_rate": 9.9950561328714e-06, "epoch": 0.5, "percentage": 50.39, "elapsed_time": "21:22:32", "remaining_time": "21:02:43"} +{"current_steps": 3569, "total_steps": 7063, "loss": 0.0042, "reward": -0.3914, "learning_rate": 9.990311553625229e-06, "epoch": 0.51, "percentage": 50.53, "elapsed_time": "21:26:08", "remaining_time": "20:59:07"} +{"current_steps": 3579, "total_steps": 7063, "loss": 0.0038, "reward": -0.1993, "learning_rate": 9.983987783765245e-06, "epoch": 0.51, "percentage": 50.67, "elapsed_time": "21:29:45", "remaining_time": "20:55:31"} +{"current_steps": 3589, "total_steps": 7063, "loss": 0.0029, "reward": -0.3465, "learning_rate": 9.976086824456686e-06, "epoch": 0.51, "percentage": 50.81, "elapsed_time": "21:33:28", "remaining_time": "20:52:02"} +{"current_steps": 3599, "total_steps": 7063, "loss": 0.0034, "reward": -0.209, "learning_rate": 9.966611175968454e-06, "epoch": 0.51, "percentage": 50.96, "elapsed_time": "21:37:19", "remaining_time": "20:48:39"} +{"current_steps": 3609, "total_steps": 7063, "loss": 0.0032, "reward": -0.2638, "learning_rate": 9.955563836881898e-06, "epoch": 0.51, "percentage": 51.1, "elapsed_time": "21:40:55", "remaining_time": "20:45:03"} +{"current_steps": 3619, "total_steps": 7063, "loss": 0.0032, "reward": -0.2811, "learning_rate": 9.94294830314191e-06, "epoch": 0.51, "percentage": 51.24, "elapsed_time": "21:44:31", "remaining_time": "20:41:26"} +{"current_steps": 3629, "total_steps": 7063, "loss": 0.0038, "reward": -0.3794, "learning_rate": 9.928768566950635e-06, "epoch": 0.51, "percentage": 51.38, "elapsed_time": "21:48:19", "remaining_time": "20:38:01"} +{"current_steps": 3639, "total_steps": 7063, "loss": 0.0038, "reward": -0.3419, "learning_rate": 9.91302911550412e-06, "epoch": 0.52, "percentage": 51.52, "elapsed_time": "21:51:59", "remaining_time": "20:34:28"} +{"current_steps": 3649, "total_steps": 7063, "loss": 0.0032, "reward": -0.31, "learning_rate": 9.89573492957235e-06, "epoch": 0.52, "percentage": 51.66, "elapsed_time": "21:55:38", "remaining_time": "20:30:54"} +{"current_steps": 3659, "total_steps": 7063, "loss": 0.0034, "reward": -0.1604, "learning_rate": 9.876891481923067e-06, "epoch": 0.52, "percentage": 51.81, "elapsed_time": "21:59:16", "remaining_time": "20:27:20"} +{"current_steps": 3669, "total_steps": 7063, "loss": 0.0035, "reward": -0.1379, "learning_rate": 9.85650473558991e-06, "epoch": 0.52, "percentage": 51.95, "elapsed_time": "22:02:50", "remaining_time": "20:23:41"} +{"current_steps": 3679, "total_steps": 7063, "loss": 0.0038, "reward": -0.3531, "learning_rate": 9.834581141985404e-06, "epoch": 0.52, "percentage": 52.09, "elapsed_time": "22:06:38", "remaining_time": "20:20:16"} +{"current_steps": 3689, "total_steps": 7063, "loss": 0.0028, "reward": -0.1161, "learning_rate": 9.811127638859398e-06, "epoch": 0.52, "percentage": 52.23, "elapsed_time": "22:10:25", "remaining_time": "20:16:49"} +{"current_steps": 3699, "total_steps": 7063, "loss": 0.0038, "reward": -0.3628, "learning_rate": 9.786151648103615e-06, "epoch": 0.52, "percentage": 52.37, "elapsed_time": "22:13:55", "remaining_time": "20:13:06"} +{"current_steps": 3709, "total_steps": 7063, "loss": 0.0033, "reward": -0.3243, "learning_rate": 9.759661073402971e-06, "epoch": 0.53, "percentage": 52.51, "elapsed_time": "22:17:26", "remaining_time": "20:09:25"} +{"current_steps": 3719, "total_steps": 7063, "loss": 0.0028, "reward": -0.2481, "learning_rate": 9.731664297734458e-06, "epoch": 0.53, "percentage": 52.65, "elapsed_time": "22:21:03", "remaining_time": "20:05:49"} +{"current_steps": 3729, "total_steps": 7063, "loss": 0.0038, "reward": -0.3179, "learning_rate": 9.702170180714325e-06, "epoch": 0.53, "percentage": 52.8, "elapsed_time": "22:24:43", "remaining_time": "20:02:17"} +{"current_steps": 3739, "total_steps": 7063, "loss": 0.0028, "reward": -0.1725, "learning_rate": 9.671188055794462e-06, "epoch": 0.53, "percentage": 52.94, "elapsed_time": "22:28:27", "remaining_time": "19:58:47"} +{"current_steps": 3749, "total_steps": 7063, "loss": 0.003, "reward": -0.1697, "learning_rate": 9.63872772730879e-06, "epoch": 0.53, "percentage": 53.08, "elapsed_time": "22:32:01", "remaining_time": "19:55:08"} +{"current_steps": 3759, "total_steps": 7063, "loss": 0.0035, "reward": -0.2575, "learning_rate": 9.604799467370689e-06, "epoch": 0.53, "percentage": 53.22, "elapsed_time": "22:35:40", "remaining_time": "19:51:35"} +{"current_steps": 3769, "total_steps": 7063, "loss": 0.0043, "reward": -0.3233, "learning_rate": 9.569414012622358e-06, "epoch": 0.53, "percentage": 53.36, "elapsed_time": "22:39:21", "remaining_time": "19:48:02"} +{"current_steps": 3779, "total_steps": 7063, "loss": 0.0031, "reward": -0.0708, "learning_rate": 9.532582560837208e-06, "epoch": 0.54, "percentage": 53.5, "elapsed_time": "22:42:57", "remaining_time": "19:44:25"} +{"current_steps": 3789, "total_steps": 7063, "loss": 0.003, "reward": -0.2344, "learning_rate": 9.494316767376295e-06, "epoch": 0.54, "percentage": 53.65, "elapsed_time": "22:46:33", "remaining_time": "19:40:48"} +{"current_steps": 3799, "total_steps": 7063, "loss": 0.0036, "reward": -0.0844, "learning_rate": 9.454628741499978e-06, "epoch": 0.54, "percentage": 53.79, "elapsed_time": "22:50:00", "remaining_time": "19:37:04"} +{"current_steps": 3809, "total_steps": 7063, "loss": 0.0034, "reward": -0.2369, "learning_rate": 9.413531042535916e-06, "epoch": 0.54, "percentage": 53.93, "elapsed_time": "22:53:32", "remaining_time": "19:33:24"} +{"current_steps": 3819, "total_steps": 7063, "loss": 0.0036, "reward": -0.3654, "learning_rate": 9.371036675904671e-06, "epoch": 0.54, "percentage": 54.07, "elapsed_time": "22:57:04", "remaining_time": "19:29:44"} +{"current_steps": 3829, "total_steps": 7063, "loss": 0.0036, "reward": -0.2757, "learning_rate": 9.327159089004098e-06, "epoch": 0.54, "percentage": 54.21, "elapsed_time": "23:00:40", "remaining_time": "19:26:07"} +{"current_steps": 3839, "total_steps": 7063, "loss": 0.0035, "reward": -0.3181, "learning_rate": 9.281912166953932e-06, "epoch": 0.54, "percentage": 54.35, "elapsed_time": "23:04:19", "remaining_time": "19:22:33"} +{"current_steps": 3849, "total_steps": 7063, "loss": 0.0048, "reward": -0.3122, "learning_rate": 9.235310228201784e-06, "epoch": 0.54, "percentage": 54.5, "elapsed_time": "23:07:53", "remaining_time": "19:18:55"} +{"current_steps": 3859, "total_steps": 7063, "loss": 0.0033, "reward": -0.2904, "learning_rate": 9.187368019992095e-06, "epoch": 0.55, "percentage": 54.64, "elapsed_time": "23:11:25", "remaining_time": "19:15:14"} +{"current_steps": 3869, "total_steps": 7063, "loss": 0.0037, "reward": -0.1489, "learning_rate": 9.138100713699312e-06, "epoch": 0.55, "percentage": 54.78, "elapsed_time": "23:14:57", "remaining_time": "19:11:34"} +{"current_steps": 3879, "total_steps": 7063, "loss": 0.0029, "reward": -0.2763, "learning_rate": 9.087523900026905e-06, "epoch": 0.55, "percentage": 54.92, "elapsed_time": "23:18:43", "remaining_time": "19:08:06"} +{"current_steps": 3889, "total_steps": 7063, "loss": 0.003, "reward": -0.1622, "learning_rate": 9.035653584073675e-06, "epoch": 0.55, "percentage": 55.06, "elapsed_time": "23:22:34", "remaining_time": "19:04:42"} +{"current_steps": 3899, "total_steps": 7063, "loss": 0.0034, "reward": -0.3107, "learning_rate": 8.982506180268893e-06, "epoch": 0.55, "percentage": 55.2, "elapsed_time": "23:26:10", "remaining_time": "19:01:06"} +{"current_steps": 3909, "total_steps": 7063, "loss": 0.0033, "reward": -0.1224, "learning_rate": 8.928098507177972e-06, "epoch": 0.55, "percentage": 55.34, "elapsed_time": "23:29:40", "remaining_time": "18:57:24"} +{"current_steps": 3919, "total_steps": 7063, "loss": 0.0038, "reward": -0.1105, "learning_rate": 8.872447782180166e-06, "epoch": 0.55, "percentage": 55.49, "elapsed_time": "23:33:12", "remaining_time": "18:53:44"} +{"current_steps": 3929, "total_steps": 7063, "loss": 0.0031, "reward": -0.348, "learning_rate": 8.815571616020149e-06, "epoch": 0.56, "percentage": 55.63, "elapsed_time": "23:36:58", "remaining_time": "18:50:15"} +{"current_steps": 3939, "total_steps": 7063, "loss": 0.0035, "reward": -0.2409, "learning_rate": 8.757488007235031e-06, "epoch": 0.56, "percentage": 55.77, "elapsed_time": "23:40:39", "remaining_time": "18:46:43"} +{"current_steps": 3949, "total_steps": 7063, "loss": 0.0033, "reward": -0.3141, "learning_rate": 8.698215336458744e-06, "epoch": 0.56, "percentage": 55.91, "elapsed_time": "23:44:14", "remaining_time": "18:43:05"} +{"current_steps": 3959, "total_steps": 7063, "loss": 0.0034, "reward": -0.313, "learning_rate": 8.637772360605418e-06, "epoch": 0.56, "percentage": 56.05, "elapsed_time": "23:47:50", "remaining_time": "18:39:29"} +{"current_steps": 3969, "total_steps": 7063, "loss": 0.0046, "reward": -0.4326, "learning_rate": 8.576178206933775e-06, "epoch": 0.56, "percentage": 56.19, "elapsed_time": "23:51:21", "remaining_time": "18:35:47"} +{"current_steps": 3979, "total_steps": 7063, "loss": 0.003, "reward": -0.1198, "learning_rate": 8.513452366994239e-06, "epoch": 0.56, "percentage": 56.34, "elapsed_time": "23:55:04", "remaining_time": "18:32:17"} +{"current_steps": 3989, "total_steps": 7063, "loss": 0.0032, "reward": -0.1191, "learning_rate": 8.44961469046086e-06, "epoch": 0.56, "percentage": 56.48, "elapsed_time": "23:58:39", "remaining_time": "18:28:39"} +{"current_steps": 3999, "total_steps": 7063, "loss": 0.0041, "reward": -0.3557, "learning_rate": 8.384685378849806e-06, "epoch": 0.57, "percentage": 56.62, "elapsed_time": "1 day, 0:02:05", "remaining_time": "18:24:55"} +{"current_steps": 4009, "total_steps": 7063, "loss": 0.0035, "reward": -0.2939, "learning_rate": 8.318684979126612e-06, "epoch": 0.57, "percentage": 56.76, "elapsed_time": "1 day, 0:05:45", "remaining_time": "18:21:21"} +{"current_steps": 4019, "total_steps": 7063, "loss": 0.0049, "reward": -0.1952, "learning_rate": 8.251634377204026e-06, "epoch": 0.57, "percentage": 56.9, "elapsed_time": "1 day, 0:09:20", "remaining_time": "18:17:43"} +{"current_steps": 4029, "total_steps": 7063, "loss": 0.0029, "reward": -0.1551, "learning_rate": 8.183554791332677e-06, "epoch": 0.57, "percentage": 57.04, "elapsed_time": "1 day, 0:12:58", "remaining_time": "18:14:08"} +{"current_steps": 4039, "total_steps": 7063, "loss": 0.0043, "reward": -0.2539, "learning_rate": 8.114467765386494e-06, "epoch": 0.57, "percentage": 57.19, "elapsed_time": "1 day, 0:16:28", "remaining_time": "18:10:27"} +{"current_steps": 4049, "total_steps": 7063, "loss": 0.0037, "reward": -0.3849, "learning_rate": 8.04439516204514e-06, "epoch": 0.57, "percentage": 57.33, "elapsed_time": "1 day, 0:20:05", "remaining_time": "18:06:52"} +{"current_steps": 4059, "total_steps": 7063, "loss": 0.0028, "reward": -0.2593, "learning_rate": 7.973359155875525e-06, "epoch": 0.57, "percentage": 57.47, "elapsed_time": "1 day, 0:23:47", "remaining_time": "18:03:20"} +{"current_steps": 4069, "total_steps": 7063, "loss": 0.0032, "reward": -0.1569, "learning_rate": 7.901382226314662e-06, "epoch": 0.58, "percentage": 57.61, "elapsed_time": "1 day, 0:27:23", "remaining_time": "17:59:43"} +{"current_steps": 4079, "total_steps": 7063, "loss": 0.0035, "reward": -0.4049, "learning_rate": 7.82848715055598e-06, "epoch": 0.58, "percentage": 57.75, "elapsed_time": "1 day, 0:31:06", "remaining_time": "17:56:11"} +{"current_steps": 4089, "total_steps": 7063, "loss": 0.0031, "reward": -0.3131, "learning_rate": 7.75469699634149e-06, "epoch": 0.58, "percentage": 57.89, "elapsed_time": "1 day, 0:34:39", "remaining_time": "17:52:32"} +{"current_steps": 4099, "total_steps": 7063, "loss": 0.0033, "reward": -0.2798, "learning_rate": 7.68003511466193e-06, "epoch": 0.58, "percentage": 58.03, "elapsed_time": "1 day, 0:38:13", "remaining_time": "17:48:54"} +{"current_steps": 4109, "total_steps": 7063, "loss": 0.0034, "reward": -0.2349, "learning_rate": 7.604525132367354e-06, "epoch": 0.58, "percentage": 58.18, "elapsed_time": "1 day, 0:41:51", "remaining_time": "17:45:19"} +{"current_steps": 4119, "total_steps": 7063, "loss": 0.0034, "reward": -0.1358, "learning_rate": 7.528190944690358e-06, "epoch": 0.58, "percentage": 58.32, "elapsed_time": "1 day, 0:45:18", "remaining_time": "17:41:36"} +{"current_steps": 4129, "total_steps": 7063, "loss": 0.0034, "reward": -0.1241, "learning_rate": 7.4510567076843945e-06, "epoch": 0.58, "percentage": 58.46, "elapsed_time": "1 day, 0:48:42", "remaining_time": "17:37:51"} +{"current_steps": 4139, "total_steps": 7063, "loss": 0.0031, "reward": -0.0964, "learning_rate": 7.373146830579598e-06, "epoch": 0.59, "percentage": 58.6, "elapsed_time": "1 day, 0:52:15", "remaining_time": "17:34:12"} +{"current_steps": 4149, "total_steps": 7063, "loss": 0.003, "reward": -0.064, "learning_rate": 7.294485968058401e-06, "epoch": 0.59, "percentage": 58.74, "elapsed_time": "1 day, 0:55:49", "remaining_time": "17:30:34"} +{"current_steps": 4159, "total_steps": 7063, "loss": 0.0031, "reward": -0.2023, "learning_rate": 7.2150990124535726e-06, "epoch": 0.59, "percentage": 58.88, "elapsed_time": "1 day, 0:59:28", "remaining_time": "17:27:00"} +{"current_steps": 4169, "total_steps": 7063, "loss": 0.0035, "reward": -0.3227, "learning_rate": 7.135011085870962e-06, "epoch": 0.59, "percentage": 59.03, "elapsed_time": "1 day, 1:03:12", "remaining_time": "17:23:29"} +{"current_steps": 4179, "total_steps": 7063, "loss": 0.003, "reward": -0.1747, "learning_rate": 7.054247532239637e-06, "epoch": 0.59, "percentage": 59.17, "elapsed_time": "1 day, 1:06:48", "remaining_time": "17:19:52"} +{"current_steps": 4189, "total_steps": 7063, "loss": 0.003, "reward": -0.1391, "learning_rate": 6.9728339092916915e-06, "epoch": 0.59, "percentage": 59.31, "elapsed_time": "1 day, 1:10:19", "remaining_time": "17:16:12"} +{"current_steps": 4199, "total_steps": 7063, "loss": 0.0029, "reward": -0.1152, "learning_rate": 6.890795980474532e-06, "epoch": 0.59, "percentage": 59.45, "elapsed_time": "1 day, 1:13:55", "remaining_time": "17:12:35"} +{"current_steps": 4209, "total_steps": 7063, "loss": 0.0027, "reward": -0.225, "learning_rate": 6.808159706797946e-06, "epoch": 0.6, "percentage": 59.59, "elapsed_time": "1 day, 1:17:24", "remaining_time": "17:08:54"} +{"current_steps": 4219, "total_steps": 7063, "loss": 0.0035, "reward": -0.107, "learning_rate": 6.72495123861877e-06, "epoch": 0.6, "percentage": 59.73, "elapsed_time": "1 day, 1:20:55", "remaining_time": "17:05:14"} +{"current_steps": 4229, "total_steps": 7063, "loss": 0.0037, "reward": -0.213, "learning_rate": 6.6411969073655014e-06, "epoch": 0.6, "percentage": 59.88, "elapsed_time": "1 day, 1:24:32", "remaining_time": "17:01:38"} +{"current_steps": 4239, "total_steps": 7063, "loss": 0.0029, "reward": -0.2639, "learning_rate": 6.55692321720575e-06, "epoch": 0.6, "percentage": 60.02, "elapsed_time": "1 day, 1:28:15", "remaining_time": "16:58:07"} +{"current_steps": 4249, "total_steps": 7063, "loss": 0.0034, "reward": -0.1981, "learning_rate": 6.472156836658903e-06, "epoch": 0.6, "percentage": 60.16, "elapsed_time": "1 day, 1:31:44", "remaining_time": "16:54:25"} +{"current_steps": 4259, "total_steps": 7063, "loss": 0.0035, "reward": -0.1908, "learning_rate": 6.386924590156898e-06, "epoch": 0.6, "percentage": 60.3, "elapsed_time": "1 day, 1:35:28", "remaining_time": "16:50:54"} +{"current_steps": 4269, "total_steps": 7063, "loss": 0.0028, "reward": -0.2391, "learning_rate": 6.301253449555531e-06, "epoch": 0.6, "percentage": 60.44, "elapsed_time": "1 day, 1:39:12", "remaining_time": "16:47:23"} +{"current_steps": 4279, "total_steps": 7063, "loss": 0.0032, "reward": -0.2446, "learning_rate": 6.215170525599231e-06, "epoch": 0.61, "percentage": 60.58, "elapsed_time": "1 day, 1:42:43", "remaining_time": "16:43:43"} +{"current_steps": 4289, "total_steps": 7063, "loss": 0.0032, "reward": -0.2266, "learning_rate": 6.128703059341789e-06, "epoch": 0.61, "percentage": 60.72, "elapsed_time": "1 day, 1:46:20", "remaining_time": "16:40:07"} +{"current_steps": 4299, "total_steps": 7063, "loss": 0.0032, "reward": -0.1362, "learning_rate": 6.041878413525939e-06, "epoch": 0.61, "percentage": 60.87, "elapsed_time": "1 day, 1:49:55", "remaining_time": "16:36:30"} +{"current_steps": 4309, "total_steps": 7063, "loss": 0.0035, "reward": -0.2071, "learning_rate": 5.9547240639243184e-06, "epoch": 0.61, "percentage": 61.01, "elapsed_time": "1 day, 1:53:37", "remaining_time": "16:32:58"} +{"current_steps": 4319, "total_steps": 7063, "loss": 0.0035, "reward": -0.2041, "learning_rate": 5.867267590644787e-06, "epoch": 0.61, "percentage": 61.15, "elapsed_time": "1 day, 1:57:15", "remaining_time": "16:29:22"} +{"current_steps": 4329, "total_steps": 7063, "loss": 0.0029, "reward": -0.2125, "learning_rate": 5.779536669402611e-06, "epoch": 0.61, "percentage": 61.29, "elapsed_time": "1 day, 2:01:00", "remaining_time": "16:25:51"} +{"current_steps": 4339, "total_steps": 7063, "loss": 0.0033, "reward": -0.3047, "learning_rate": 5.6915590627625005e-06, "epoch": 0.61, "percentage": 61.43, "elapsed_time": "1 day, 2:04:38", "remaining_time": "16:22:16"} +{"current_steps": 4349, "total_steps": 7063, "loss": 0.0028, "reward": -0.2644, "learning_rate": 5.60336261135307e-06, "epoch": 0.62, "percentage": 61.57, "elapsed_time": "1 day, 2:08:20", "remaining_time": "16:18:43"} +{"current_steps": 4359, "total_steps": 7063, "loss": 0.0032, "reward": -0.2142, "learning_rate": 5.514975225056633e-06, "epoch": 0.62, "percentage": 61.72, "elapsed_time": "1 day, 2:11:52", "remaining_time": "16:15:04"} +{"current_steps": 4369, "total_steps": 7063, "loss": 0.0036, "reward": -0.2406, "learning_rate": 5.4264248741771295e-06, "epoch": 0.62, "percentage": 61.86, "elapsed_time": "1 day, 2:15:40", "remaining_time": "16:11:34"} +{"current_steps": 4379, "total_steps": 7063, "loss": 0.0035, "reward": -0.4047, "learning_rate": 5.337739580588822e-06, "epoch": 0.62, "percentage": 62.0, "elapsed_time": "1 day, 2:19:14", "remaining_time": "16:07:57"} +{"current_steps": 4389, "total_steps": 7063, "loss": 0.0034, "reward": -0.1619, "learning_rate": 5.248947408868794e-06, "epoch": 0.62, "percentage": 62.14, "elapsed_time": "1 day, 2:22:43", "remaining_time": "16:04:16"} +{"current_steps": 4399, "total_steps": 7063, "loss": 0.0028, "reward": -0.1479, "learning_rate": 5.16007645741583e-06, "epoch": 0.62, "percentage": 62.28, "elapsed_time": "1 day, 2:26:21", "remaining_time": "16:00:41"} +{"current_steps": 4409, "total_steps": 7063, "loss": 0.0034, "reward": -0.1027, "learning_rate": 5.071154849558695e-06, "epoch": 0.62, "percentage": 62.42, "elapsed_time": "1 day, 2:29:53", "remaining_time": "15:57:02"} +{"current_steps": 4419, "total_steps": 7063, "loss": 0.0034, "reward": -0.2996, "learning_rate": 4.982210724656409e-06, "epoch": 0.63, "percentage": 62.57, "elapsed_time": "1 day, 2:33:26", "remaining_time": "15:53:23"} +{"current_steps": 4429, "total_steps": 7063, "loss": 0.0028, "reward": -0.0919, "learning_rate": 4.893272229193561e-06, "epoch": 0.63, "percentage": 62.71, "elapsed_time": "1 day, 2:37:10", "remaining_time": "15:49:52"} +{"current_steps": 4439, "total_steps": 7063, "loss": 0.003, "reward": -0.1089, "learning_rate": 4.804367507873277e-06, "epoch": 0.63, "percentage": 62.85, "elapsed_time": "1 day, 2:40:48", "remaining_time": "15:46:16"} +{"current_steps": 4449, "total_steps": 7063, "loss": 0.0031, "reward": -0.1168, "learning_rate": 4.715524694710839e-06, "epoch": 0.63, "percentage": 62.99, "elapsed_time": "1 day, 2:44:34", "remaining_time": "15:42:45"} +{"current_steps": 4459, "total_steps": 7063, "loss": 0.0034, "reward": -0.3128, "learning_rate": 4.626771904130584e-06, "epoch": 0.63, "percentage": 63.13, "elapsed_time": "1 day, 2:48:08", "remaining_time": "15:39:08"} +{"current_steps": 4469, "total_steps": 7063, "loss": 0.0041, "reward": -0.1848, "learning_rate": 4.538137222069105e-06, "epoch": 0.63, "percentage": 63.27, "elapsed_time": "1 day, 2:51:34", "remaining_time": "15:35:25"} +{"current_steps": 4479, "total_steps": 7063, "loss": 0.0032, "reward": -0.1865, "learning_rate": 4.449648697087378e-06, "epoch": 0.63, "percentage": 63.41, "elapsed_time": "1 day, 2:55:17", "remaining_time": "15:31:53"} +{"current_steps": 4489, "total_steps": 7063, "loss": 0.0027, "reward": -0.1697, "learning_rate": 4.361334331494812e-06, "epoch": 0.64, "percentage": 63.56, "elapsed_time": "1 day, 2:58:57", "remaining_time": "15:28:18"} +{"current_steps": 4499, "total_steps": 7063, "loss": 0.0035, "reward": -0.1667, "learning_rate": 4.2732220724878194e-06, "epoch": 0.64, "percentage": 63.7, "elapsed_time": "1 day, 3:02:27", "remaining_time": "15:24:38"} +{"current_steps": 4509, "total_steps": 7063, "loss": 0.0038, "reward": -0.3111, "learning_rate": 4.185339803305934e-06, "epoch": 0.64, "percentage": 63.84, "elapsed_time": "1 day, 3:06:03", "remaining_time": "15:21:02"} +{"current_steps": 4519, "total_steps": 7063, "loss": 0.003, "reward": -0.2045, "learning_rate": 4.097715334408112e-06, "epoch": 0.64, "percentage": 63.98, "elapsed_time": "1 day, 3:09:40", "remaining_time": "15:17:26"} +{"current_steps": 4529, "total_steps": 7063, "loss": 0.0031, "reward": -0.152, "learning_rate": 4.010376394672062e-06, "epoch": 0.64, "percentage": 64.12, "elapsed_time": "1 day, 3:13:05", "remaining_time": "15:13:43"} +{"current_steps": 4539, "total_steps": 7063, "loss": 0.003, "reward": -0.2064, "learning_rate": 3.9233506226194126e-06, "epoch": 0.64, "percentage": 64.26, "elapsed_time": "1 day, 3:16:46", "remaining_time": "15:10:09"} +{"current_steps": 4549, "total_steps": 7063, "loss": 0.0034, "reward": -0.2407, "learning_rate": 3.836665557669496e-06, "epoch": 0.64, "percentage": 64.41, "elapsed_time": "1 day, 3:20:20", "remaining_time": "15:06:31"} +{"current_steps": 4559, "total_steps": 7063, "loss": 0.0029, "reward": -0.1174, "learning_rate": 3.750348631424402e-06, "epoch": 0.65, "percentage": 64.55, "elapsed_time": "1 day, 3:23:59", "remaining_time": "15:02:57"} +{"current_steps": 4569, "total_steps": 7063, "loss": 0.003, "reward": -0.2606, "learning_rate": 3.66442715898827e-06, "epoch": 0.65, "percentage": 64.69, "elapsed_time": "1 day, 3:27:19", "remaining_time": "14:59:11"} +{"current_steps": 4579, "total_steps": 7063, "loss": 0.003, "reward": -0.1689, "learning_rate": 3.578928330323367e-06, "epoch": 0.65, "percentage": 64.83, "elapsed_time": "1 day, 3:30:59", "remaining_time": "14:55:37"} +{"current_steps": 4589, "total_steps": 7063, "loss": 0.0028, "reward": -0.2151, "learning_rate": 3.493879201645759e-06, "epoch": 0.65, "percentage": 64.97, "elapsed_time": "1 day, 3:34:36", "remaining_time": "14:52:01"} +{"current_steps": 4599, "total_steps": 7063, "loss": 0.0029, "reward": -0.1513, "learning_rate": 3.409306686863399e-06, "epoch": 0.65, "percentage": 65.11, "elapsed_time": "1 day, 3:38:20", "remaining_time": "14:48:29"} +{"current_steps": 4609, "total_steps": 7063, "loss": 0.0026, "reward": -0.0821, "learning_rate": 3.3252375490591217e-06, "epoch": 0.65, "percentage": 65.26, "elapsed_time": "1 day, 3:42:06", "remaining_time": "14:44:57"} +{"current_steps": 4619, "total_steps": 7063, "loss": 0.0034, "reward": -0.2608, "learning_rate": 3.24169839202147e-06, "epoch": 0.65, "percentage": 65.4, "elapsed_time": "1 day, 3:45:31", "remaining_time": "14:41:15"} +{"current_steps": 4629, "total_steps": 7063, "loss": 0.0028, "reward": -0.132, "learning_rate": 3.158715651825871e-06, "epoch": 0.66, "percentage": 65.54, "elapsed_time": "1 day, 3:49:17", "remaining_time": "14:37:44"} +{"current_steps": 4639, "total_steps": 7063, "loss": 0.0028, "reward": -0.0714, "learning_rate": 3.076315588468941e-06, "epoch": 0.66, "percentage": 65.68, "elapsed_time": "1 day, 3:52:55", "remaining_time": "14:34:09"} +{"current_steps": 4649, "total_steps": 7063, "loss": 0.0032, "reward": -0.2108, "learning_rate": 2.9945242775584143e-06, "epoch": 0.66, "percentage": 65.82, "elapsed_time": "1 day, 3:56:23", "remaining_time": "14:30:28"} +{"current_steps": 4659, "total_steps": 7063, "loss": 0.0027, "reward": -0.0474, "learning_rate": 2.913367602061552e-06, "epoch": 0.66, "percentage": 65.96, "elapsed_time": "1 day, 4:00:02", "remaining_time": "14:26:53"} +{"current_steps": 4669, "total_steps": 7063, "loss": 0.0033, "reward": -0.287, "learning_rate": 2.832871244114375e-06, "epoch": 0.66, "percentage": 66.11, "elapsed_time": "1 day, 4:03:44", "remaining_time": "14:23:19"} +{"current_steps": 4679, "total_steps": 7063, "loss": 0.0029, "reward": -0.2081, "learning_rate": 2.753060676894588e-06, "epoch": 0.66, "percentage": 66.25, "elapsed_time": "1 day, 4:07:17", "remaining_time": "14:19:41"} +{"current_steps": 4689, "total_steps": 7063, "loss": 0.0036, "reward": -0.1504, "learning_rate": 2.6739611565604947e-06, "epoch": 0.66, "percentage": 66.39, "elapsed_time": "1 day, 4:11:01", "remaining_time": "14:16:08"} +{"current_steps": 4699, "total_steps": 7063, "loss": 0.0033, "reward": -0.2813, "learning_rate": 2.5955977142586946e-06, "epoch": 0.67, "percentage": 66.53, "elapsed_time": "1 day, 4:14:24", "remaining_time": "14:12:25"} +{"current_steps": 4709, "total_steps": 7063, "loss": 0.0029, "reward": -0.3317, "learning_rate": 2.5179951482029225e-06, "epoch": 0.67, "percentage": 66.67, "elapsed_time": "1 day, 4:18:03", "remaining_time": "14:08:50"} +{"current_steps": 4719, "total_steps": 7063, "loss": 0.0029, "reward": -0.1715, "learning_rate": 2.4411780158266533e-06, "epoch": 0.67, "percentage": 66.81, "elapsed_time": "1 day, 4:21:35", "remaining_time": "14:05:12"} +{"current_steps": 4729, "total_steps": 7063, "loss": 0.0029, "reward": -0.1342, "learning_rate": 2.3651706260118184e-06, "epoch": 0.67, "percentage": 66.95, "elapsed_time": "1 day, 4:25:05", "remaining_time": "14:01:32"} +{"current_steps": 4739, "total_steps": 7063, "loss": 0.0032, "reward": -0.0324, "learning_rate": 2.289997031396286e-06, "epoch": 0.67, "percentage": 67.1, "elapsed_time": "1 day, 4:28:45", "remaining_time": "13:57:58"} +{"current_steps": 4749, "total_steps": 7063, "loss": 0.0032, "reward": -0.1613, "learning_rate": 2.215681020762313e-06, "epoch": 0.67, "percentage": 67.24, "elapsed_time": "1 day, 4:32:16", "remaining_time": "13:54:19"} +{"current_steps": 4759, "total_steps": 7063, "loss": 0.0027, "reward": -0.2861, "learning_rate": 2.1422461115086167e-06, "epoch": 0.67, "percentage": 67.38, "elapsed_time": "1 day, 4:35:56", "remaining_time": "13:50:44"} +{"current_steps": 4769, "total_steps": 7063, "loss": 0.0026, "reward": -0.181, "learning_rate": 2.069715542208207e-06, "epoch": 0.68, "percentage": 67.52, "elapsed_time": "1 day, 4:39:29", "remaining_time": "13:47:07"} +{"current_steps": 4779, "total_steps": 7063, "loss": 0.0028, "reward": -0.1974, "learning_rate": 1.998112265254541e-06, "epoch": 0.68, "percentage": 67.66, "elapsed_time": "1 day, 4:43:14", "remaining_time": "13:43:34"} +{"current_steps": 4789, "total_steps": 7063, "loss": 0.0036, "reward": -0.2612, "learning_rate": 1.9274589395981937e-06, "epoch": 0.68, "percentage": 67.8, "elapsed_time": "1 day, 4:46:46", "remaining_time": "13:39:56"} +{"current_steps": 4799, "total_steps": 7063, "loss": 0.0031, "reward": -0.1949, "learning_rate": 1.8577779235764249e-06, "epoch": 0.68, "percentage": 67.95, "elapsed_time": "1 day, 4:50:16", "remaining_time": "13:36:17"} +{"current_steps": 4809, "total_steps": 7063, "loss": 0.0033, "reward": -0.1398, "learning_rate": 1.7890912678378392e-06, "epoch": 0.68, "percentage": 68.09, "elapsed_time": "1 day, 4:53:49", "remaining_time": "13:32:39"} +{"current_steps": 4819, "total_steps": 7063, "loss": 0.0032, "reward": -0.1068, "learning_rate": 1.7214207083644098e-06, "epoch": 0.68, "percentage": 68.23, "elapsed_time": "1 day, 4:57:23", "remaining_time": "13:29:01"} +{"current_steps": 4829, "total_steps": 7063, "loss": 0.0028, "reward": -0.2427, "learning_rate": 1.6547876595931444e-06, "epoch": 0.68, "percentage": 68.37, "elapsed_time": "1 day, 5:01:03", "remaining_time": "13:25:27"} +{"current_steps": 4839, "total_steps": 7063, "loss": 0.0031, "reward": -0.0524, "learning_rate": 1.5892132076394151e-06, "epoch": 0.69, "percentage": 68.51, "elapsed_time": "1 day, 5:04:35", "remaining_time": "13:21:48"} +{"current_steps": 4849, "total_steps": 7063, "loss": 0.0029, "reward": -0.1146, "learning_rate": 1.524718103624252e-06, "epoch": 0.69, "percentage": 68.65, "elapsed_time": "1 day, 5:08:21", "remaining_time": "13:18:16"} +{"current_steps": 4859, "total_steps": 7063, "loss": 0.0029, "reward": -0.1041, "learning_rate": 1.4613227571076138e-06, "epoch": 0.69, "percentage": 68.8, "elapsed_time": "1 day, 5:12:05", "remaining_time": "13:14:43"} +{"current_steps": 4869, "total_steps": 7063, "loss": 0.0025, "reward": -0.2616, "learning_rate": 1.3990472296297808e-06, "epoch": 0.69, "percentage": 68.94, "elapsed_time": "1 day, 5:15:48", "remaining_time": "13:11:10"} +{"current_steps": 4879, "total_steps": 7063, "loss": 0.0029, "reward": -0.187, "learning_rate": 1.3379112283628081e-06, "epoch": 0.69, "percentage": 69.08, "elapsed_time": "1 day, 5:19:21", "remaining_time": "13:07:32"} +{"current_steps": 4889, "total_steps": 7063, "loss": 0.0032, "reward": -0.1955, "learning_rate": 1.2779340998742185e-06, "epoch": 0.69, "percentage": 69.22, "elapsed_time": "1 day, 5:22:54", "remaining_time": "13:03:54"} +{"current_steps": 4899, "total_steps": 7063, "loss": 0.0028, "reward": -0.106, "learning_rate": 1.219134824004704e-06, "epoch": 0.69, "percentage": 69.36, "elapsed_time": "1 day, 5:26:26", "remaining_time": "13:00:16"} +{"current_steps": 4909, "total_steps": 7063, "loss": 0.0032, "reward": -0.2001, "learning_rate": 1.16153200786198e-06, "epoch": 0.7, "percentage": 69.5, "elapsed_time": "1 day, 5:29:57", "remaining_time": "12:56:37"} +{"current_steps": 4919, "total_steps": 7063, "loss": 0.0029, "reward": -0.1302, "learning_rate": 1.1051438799324999e-06, "epoch": 0.7, "percentage": 69.64, "elapsed_time": "1 day, 5:33:40", "remaining_time": "12:53:04"} +{"current_steps": 4929, "total_steps": 7063, "loss": 0.0032, "reward": -0.2308, "learning_rate": 1.0499882843130487e-06, "epoch": 0.7, "percentage": 69.79, "elapsed_time": "1 day, 5:37:09", "remaining_time": "12:49:25"} +{"current_steps": 4939, "total_steps": 7063, "loss": 0.0028, "reward": -0.2366, "learning_rate": 9.96082675063948e-07, "epoch": 0.7, "percentage": 69.93, "elapsed_time": "1 day, 5:40:48", "remaining_time": "12:45:49"} +{"current_steps": 4949, "total_steps": 7063, "loss": 0.003, "reward": -0.1516, "learning_rate": 9.43444110685714e-07, "epoch": 0.7, "percentage": 70.07, "elapsed_time": "1 day, 5:44:26", "remaining_time": "12:42:14"} +{"current_steps": 4959, "total_steps": 7063, "loss": 0.0034, "reward": 0.0169, "learning_rate": 8.920892487208343e-07, "epoch": 0.7, "percentage": 70.21, "elapsed_time": "1 day, 5:47:51", "remaining_time": "12:38:33"} +{"current_steps": 4969, "total_steps": 7063, "loss": 0.0026, "reward": -0.0979, "learning_rate": 8.420343404825132e-07, "epoch": 0.7, "percentage": 70.35, "elapsed_time": "1 day, 5:51:30", "remaining_time": "12:34:57"} +{"current_steps": 4979, "total_steps": 7063, "loss": 0.003, "reward": -0.1379, "learning_rate": 7.932952259118776e-07, "epoch": 0.7, "percentage": 70.49, "elapsed_time": "1 day, 5:55:18", "remaining_time": "12:31:26"} +{"current_steps": 4989, "total_steps": 7063, "loss": 0.0035, "reward": -0.0396, "learning_rate": 7.458873285654489e-07, "epoch": 0.71, "percentage": 70.64, "elapsed_time": "1 day, 5:58:57", "remaining_time": "12:27:51"} +{"current_steps": 4999, "total_steps": 7063, "loss": 0.0027, "reward": 0.0041, "learning_rate": 6.998256507343016e-07, "epoch": 0.71, "percentage": 70.78, "elapsed_time": "1 day, 6:02:36", "remaining_time": "12:24:16"} +{"current_steps": 5009, "total_steps": 7063, "loss": 0.0034, "reward": -0.1662, "learning_rate": 6.551247686965872e-07, "epoch": 0.71, "percentage": 70.92, "elapsed_time": "1 day, 6:06:04", "remaining_time": "12:20:35"} +{"current_steps": 5019, "total_steps": 7063, "loss": 0.0032, "reward": -0.1413, "learning_rate": 6.117988281048626e-07, "epoch": 0.71, "percentage": 71.06, "elapsed_time": "1 day, 6:09:49", "remaining_time": "12:17:03"} +{"current_steps": 5029, "total_steps": 7063, "loss": 0.0029, "reward": -0.2091, "learning_rate": 5.698615395096485e-07, "epoch": 0.71, "percentage": 71.2, "elapsed_time": "1 day, 6:13:19", "remaining_time": "12:13:24"} +{"current_steps": 5039, "total_steps": 7063, "loss": 0.0028, "reward": -0.2433, "learning_rate": 5.293261740207456e-07, "epoch": 0.71, "percentage": 71.34, "elapsed_time": "1 day, 6:17:17", "remaining_time": "12:09:56"} +{"current_steps": 5049, "total_steps": 7063, "loss": 0.0031, "reward": -0.2965, "learning_rate": 4.902055591075355e-07, "epoch": 0.71, "percentage": 71.49, "elapsed_time": "1 day, 6:21:03", "remaining_time": "12:06:24"} +{"current_steps": 5059, "total_steps": 7063, "loss": 0.0029, "reward": -0.1276, "learning_rate": 4.525120745397493e-07, "epoch": 0.72, "percentage": 71.63, "elapsed_time": "1 day, 6:24:46", "remaining_time": "12:02:50"} +{"current_steps": 5069, "total_steps": 7063, "loss": 0.0031, "reward": -0.1481, "learning_rate": 4.1625764846984276e-07, "epoch": 0.72, "percentage": 71.77, "elapsed_time": "1 day, 6:28:37", "remaining_time": "11:59:19"} +{"current_steps": 5079, "total_steps": 7063, "loss": 0.0028, "reward": -0.1388, "learning_rate": 3.814537536583318e-07, "epoch": 0.72, "percentage": 71.91, "elapsed_time": "1 day, 6:32:20", "remaining_time": "11:55:45"} +{"current_steps": 5089, "total_steps": 7063, "loss": 0.003, "reward": -0.2624, "learning_rate": 3.481114038432176e-07, "epoch": 0.72, "percentage": 72.05, "elapsed_time": "1 day, 6:35:52", "remaining_time": "11:52:07"} +{"current_steps": 5099, "total_steps": 7063, "loss": 0.0029, "reward": -0.0321, "learning_rate": 3.1624115025468695e-07, "epoch": 0.72, "percentage": 72.19, "elapsed_time": "1 day, 6:39:37", "remaining_time": "11:48:34"} +{"current_steps": 5109, "total_steps": 7063, "loss": 0.0029, "reward": -0.2161, "learning_rate": 2.8585307827613764e-07, "epoch": 0.72, "percentage": 72.33, "elapsed_time": "1 day, 6:43:04", "remaining_time": "11:44:54"} +{"current_steps": 5119, "total_steps": 7063, "loss": 0.0035, "reward": -0.2493, "learning_rate": 2.569568042526721e-07, "epoch": 0.72, "percentage": 72.48, "elapsed_time": "1 day, 6:46:47", "remaining_time": "11:41:20"} +{"current_steps": 5129, "total_steps": 7063, "loss": 0.0031, "reward": -0.1123, "learning_rate": 2.2956147244796946e-07, "epoch": 0.73, "percentage": 72.62, "elapsed_time": "1 day, 6:50:12", "remaining_time": "11:37:39"} +{"current_steps": 5139, "total_steps": 7063, "loss": 0.0031, "reward": -0.1892, "learning_rate": 2.0367575215059222e-07, "epoch": 0.73, "percentage": 72.76, "elapsed_time": "1 day, 6:53:57", "remaining_time": "11:34:06"} +{"current_steps": 5149, "total_steps": 7063, "loss": 0.0031, "reward": -0.3653, "learning_rate": 1.7930783493055936e-07, "epoch": 0.73, "percentage": 72.9, "elapsed_time": "1 day, 6:57:36", "remaining_time": "11:30:30"} +{"current_steps": 5159, "total_steps": 7063, "loss": 0.003, "reward": -0.1532, "learning_rate": 1.5646543204712595e-07, "epoch": 0.73, "percentage": 73.04, "elapsed_time": "1 day, 7:01:09", "remaining_time": "11:26:53"} +{"current_steps": 5169, "total_steps": 7063, "loss": 0.0031, "reward": -0.2271, "learning_rate": 1.3515577200853946e-07, "epoch": 0.73, "percentage": 73.18, "elapsed_time": "1 day, 7:04:49", "remaining_time": "11:23:18"} +{"current_steps": 5179, "total_steps": 7063, "loss": 0.0033, "reward": -0.1938, "learning_rate": 1.1538559828457586e-07, "epoch": 0.73, "percentage": 73.33, "elapsed_time": "1 day, 7:08:24", "remaining_time": "11:19:41"} +{"current_steps": 5189, "total_steps": 7063, "loss": 0.003, "reward": -0.2875, "learning_rate": 9.716116717254698e-08, "epoch": 0.73, "percentage": 73.47, "elapsed_time": "1 day, 7:11:57", "remaining_time": "11:16:03"} +{"current_steps": 5199, "total_steps": 7063, "loss": 0.0032, "reward": -0.1349, "learning_rate": 8.048824581750325e-08, "epoch": 0.74, "percentage": 73.61, "elapsed_time": "1 day, 7:15:29", "remaining_time": "11:12:25"} +{"current_steps": 5209, "total_steps": 7063, "loss": 0.0027, "reward": -0.1755, "learning_rate": 6.537211038719571e-08, "epoch": 0.74, "percentage": 73.75, "elapsed_time": "1 day, 7:19:06", "remaining_time": "11:08:49"} +{"current_steps": 5219, "total_steps": 7063, "loss": 0.0033, "reward": -0.1694, "learning_rate": 5.1817544402442686e-08, "epoch": 0.74, "percentage": 73.89, "elapsed_time": "1 day, 7:22:33", "remaining_time": "11:05:09"} +{"current_steps": 5229, "total_steps": 7063, "loss": 0.0027, "reward": -0.1913, "learning_rate": 3.9828837223365166e-08, "epoch": 0.74, "percentage": 74.03, "elapsed_time": "1 day, 7:26:15", "remaining_time": "11:01:34"} +{"current_steps": 5239, "total_steps": 7063, "loss": 0.0032, "reward": -0.2301, "learning_rate": 2.9409782692019218e-08, "epoch": 0.74, "percentage": 74.18, "elapsed_time": "1 day, 7:29:59", "remaining_time": "10:58:01"} +{"current_steps": 5249, "total_steps": 7063, "loss": 0.0032, "reward": -0.3049, "learning_rate": 2.056367793183134e-08, "epoch": 0.74, "percentage": 74.32, "elapsed_time": "1 day, 7:33:35", "remaining_time": "10:54:24"} +{"current_steps": 5259, "total_steps": 7063, "loss": 0.0034, "reward": -0.2132, "learning_rate": 1.3293322304213652e-08, "epoch": 0.74, "percentage": 74.46, "elapsed_time": "1 day, 7:37:12", "remaining_time": "10:50:48"} +{"current_steps": 5269, "total_steps": 7063, "loss": 0.0031, "reward": -0.2705, "learning_rate": 7.601016522708616e-09, "epoch": 0.75, "percentage": 74.6, "elapsed_time": "1 day, 7:40:46", "remaining_time": "10:47:10"} +{"current_steps": 5279, "total_steps": 7063, "loss": 0.0031, "reward": -0.1178, "learning_rate": 3.4885619249203086e-09, "epoch": 0.75, "percentage": 74.74, "elapsed_time": "1 day, 7:44:26", "remaining_time": "10:43:35"} +{"current_steps": 5289, "total_steps": 7063, "loss": 0.0031, "reward": -0.1919, "learning_rate": 9.572599024820773e-10, "epoch": 0.75, "percentage": 74.88, "elapsed_time": "1 day, 7:48:05", "remaining_time": "10:40:00"} +{"current_steps": 5299, "total_steps": 7063, "loss": 0.0029, "reward": -0.0784, "learning_rate": 7.911489227074853e-12, "epoch": 0.75, "percentage": 75.02, "elapsed_time": "1 day, 7:51:37", "remaining_time": "10:36:21"} +{"current_steps": 5309, "total_steps": 7063, "loss": 0.0031, "reward": -0.1285, "learning_rate": 6.408171077015856e-10, "epoch": 0.75, "percentage": 75.17, "elapsed_time": "1 day, 7:55:10", "remaining_time": "10:32:44"} +{"current_steps": 5319, "total_steps": 7063, "loss": 0.0031, "reward": -0.1184, "learning_rate": 2.8557764740955172e-09, "epoch": 0.75, "percentage": 75.31, "elapsed_time": "1 day, 7:58:42", "remaining_time": "10:29:06"} +{"current_steps": 5329, "total_steps": 7063, "loss": 0.003, "reward": -0.2125, "learning_rate": 6.652088661621703e-09, "epoch": 0.75, "percentage": 75.45, "elapsed_time": "1 day, 8:02:17", "remaining_time": "10:25:29"} +{"current_steps": 5339, "total_steps": 7063, "loss": 0.004, "reward": -0.202, "learning_rate": 1.2028552322327358e-08, "epoch": 0.76, "percentage": 75.59, "elapsed_time": "1 day, 8:05:58", "remaining_time": "10:21:54"} +{"current_steps": 5349, "total_steps": 7063, "loss": 0.0032, "reward": -0.206, "learning_rate": 1.898346606725887e-08, "epoch": 0.76, "percentage": 75.73, "elapsed_time": "1 day, 8:09:29", "remaining_time": "10:18:16"} +{"current_steps": 5359, "total_steps": 7063, "loss": 0.0033, "reward": -0.2027, "learning_rate": 2.7514629004871673e-08, "epoch": 0.76, "percentage": 75.87, "elapsed_time": "1 day, 8:13:01", "remaining_time": "10:14:38"} +{"current_steps": 5369, "total_steps": 7063, "loss": 0.0044, "reward": -0.2893, "learning_rate": 3.761934143750256e-08, "epoch": 0.76, "percentage": 76.02, "elapsed_time": "1 day, 8:16:35", "remaining_time": "10:11:01"} +{"current_steps": 5379, "total_steps": 7063, "loss": 0.0032, "reward": -0.1786, "learning_rate": 4.9294405715696324e-08, "epoch": 0.76, "percentage": 76.16, "elapsed_time": "1 day, 8:20:13", "remaining_time": "10:07:25"} +{"current_steps": 5389, "total_steps": 7063, "loss": 0.0033, "reward": -0.26, "learning_rate": 6.253612725009962e-08, "epoch": 0.76, "percentage": 76.3, "elapsed_time": "1 day, 8:23:52", "remaining_time": "10:03:49"} +{"current_steps": 5399, "total_steps": 7063, "loss": 0.0024, "reward": -0.2568, "learning_rate": 7.734031568062683e-08, "epoch": 0.76, "percentage": 76.44, "elapsed_time": "1 day, 8:27:29", "remaining_time": "10:00:13"} +{"current_steps": 5409, "total_steps": 7063, "loss": 0.0037, "reward": -0.1439, "learning_rate": 9.370228620249778e-08, "epoch": 0.77, "percentage": 76.58, "elapsed_time": "1 day, 8:31:02", "remaining_time": "9:56:36"} +{"current_steps": 5419, "total_steps": 7063, "loss": 0.0028, "reward": -0.2807, "learning_rate": 1.116168610487578e-07, "epoch": 0.77, "percentage": 76.72, "elapsed_time": "1 day, 8:34:35", "remaining_time": "9:52:58"} +{"current_steps": 5429, "total_steps": 7063, "loss": 0.0032, "reward": -0.2143, "learning_rate": 1.3107837112877664e-07, "epoch": 0.77, "percentage": 76.87, "elapsed_time": "1 day, 8:38:12", "remaining_time": "9:49:22"} +{"current_steps": 5439, "total_steps": 7063, "loss": 0.0031, "reward": -0.2846, "learning_rate": 1.5208065782225667e-07, "epoch": 0.77, "percentage": 77.01, "elapsed_time": "1 day, 8:41:52", "remaining_time": "9:45:47"} +{"current_steps": 5449, "total_steps": 7063, "loss": 0.0032, "reward": -0.2704, "learning_rate": 1.7461707492811786e-07, "epoch": 0.77, "percentage": 77.15, "elapsed_time": "1 day, 8:45:29", "remaining_time": "9:42:10"} +{"current_steps": 5459, "total_steps": 7063, "loss": 0.0035, "reward": -0.2247, "learning_rate": 1.9868049076771478e-07, "epoch": 0.77, "percentage": 77.29, "elapsed_time": "1 day, 8:49:08", "remaining_time": "9:38:35"} +{"current_steps": 5469, "total_steps": 7063, "loss": 0.0032, "reward": -0.1316, "learning_rate": 2.2426329044164808e-07, "epoch": 0.77, "percentage": 77.43, "elapsed_time": "1 day, 8:52:39", "remaining_time": "9:34:57"} +{"current_steps": 5479, "total_steps": 7063, "loss": 0.0033, "reward": -0.1427, "learning_rate": 2.5135737823952457e-07, "epoch": 0.78, "percentage": 77.57, "elapsed_time": "1 day, 8:56:15", "remaining_time": "9:31:20"} +{"current_steps": 5489, "total_steps": 7063, "loss": 0.0029, "reward": -0.2073, "learning_rate": 2.7995418020185016e-07, "epoch": 0.78, "percentage": 77.71, "elapsed_time": "1 day, 9:00:04", "remaining_time": "9:27:47"} +{"current_steps": 5499, "total_steps": 7063, "loss": 0.0026, "reward": -0.1949, "learning_rate": 3.100446468332596e-07, "epoch": 0.78, "percentage": 77.86, "elapsed_time": "1 day, 9:03:41", "remaining_time": "9:24:11"} +{"current_steps": 5509, "total_steps": 7063, "loss": 0.0028, "reward": -0.2821, "learning_rate": 3.41619255966264e-07, "epoch": 0.78, "percentage": 78.0, "elapsed_time": "1 day, 9:07:15", "remaining_time": "9:20:34"} +{"current_steps": 5519, "total_steps": 7063, "loss": 0.0029, "reward": -0.1413, "learning_rate": 3.746680157745258e-07, "epoch": 0.78, "percentage": 78.14, "elapsed_time": "1 day, 9:10:54", "remaining_time": "9:16:58"} +{"current_steps": 5529, "total_steps": 7063, "loss": 0.0032, "reward": -0.2282, "learning_rate": 4.091804679348144e-07, "epoch": 0.78, "percentage": 78.28, "elapsed_time": "1 day, 9:14:29", "remaining_time": "9:13:21"} +{"current_steps": 5539, "total_steps": 7063, "loss": 0.003, "reward": -0.1473, "learning_rate": 4.451456909365265e-07, "epoch": 0.78, "percentage": 78.42, "elapsed_time": "1 day, 9:18:05", "remaining_time": "9:09:45"} +{"current_steps": 5549, "total_steps": 7063, "loss": 0.0032, "reward": -0.1949, "learning_rate": 4.825523035378365e-07, "epoch": 0.79, "percentage": 78.56, "elapsed_time": "1 day, 9:21:44", "remaining_time": "9:06:09"} +{"current_steps": 5559, "total_steps": 7063, "loss": 0.0041, "reward": -0.0118, "learning_rate": 5.213884683672954e-07, "epoch": 0.79, "percentage": 78.71, "elapsed_time": "1 day, 9:25:11", "remaining_time": "9:02:30"} +{"current_steps": 5569, "total_steps": 7063, "loss": 0.0031, "reward": -0.1958, "learning_rate": 5.61641895669785e-07, "epoch": 0.79, "percentage": 78.85, "elapsed_time": "1 day, 9:28:51", "remaining_time": "8:58:55"} +{"current_steps": 5579, "total_steps": 7063, "loss": 0.003, "reward": -0.0907, "learning_rate": 6.03299847195613e-07, "epoch": 0.79, "percentage": 78.99, "elapsed_time": "1 day, 9:32:32", "remaining_time": "8:55:19"} +{"current_steps": 5589, "total_steps": 7063, "loss": 0.0032, "reward": -0.1633, "learning_rate": 6.46349140231578e-07, "epoch": 0.79, "percentage": 79.13, "elapsed_time": "1 day, 9:36:10", "remaining_time": "8:51:43"} +{"current_steps": 5599, "total_steps": 7063, "loss": 0.0037, "reward": -0.3335, "learning_rate": 6.907761517726225e-07, "epoch": 0.79, "percentage": 79.27, "elapsed_time": "1 day, 9:39:46", "remaining_time": "8:48:07"} +{"current_steps": 5609, "total_steps": 7063, "loss": 0.0032, "reward": -0.2729, "learning_rate": 7.365668228328832e-07, "epoch": 0.79, "percentage": 79.41, "elapsed_time": "1 day, 9:43:26", "remaining_time": "8:44:31"} +{"current_steps": 5619, "total_steps": 7063, "loss": 0.004, "reward": -0.2201, "learning_rate": 7.837066628946427e-07, "epoch": 0.8, "percentage": 79.56, "elapsed_time": "1 day, 9:46:54", "remaining_time": "8:40:53"} +{"current_steps": 5629, "total_steps": 7063, "loss": 0.0035, "reward": -0.1243, "learning_rate": 8.321807544939037e-07, "epoch": 0.8, "percentage": 79.7, "elapsed_time": "1 day, 9:50:22", "remaining_time": "8:37:14"} +{"current_steps": 5639, "total_steps": 7063, "loss": 0.003, "reward": -0.1845, "learning_rate": 8.819737579410198e-07, "epoch": 0.8, "percentage": 79.84, "elapsed_time": "1 day, 9:53:58", "remaining_time": "8:33:38"} +{"current_steps": 5649, "total_steps": 7063, "loss": 0.0032, "reward": -0.2037, "learning_rate": 9.33069916174974e-07, "epoch": 0.8, "percentage": 79.98, "elapsed_time": "1 day, 9:57:27", "remaining_time": "8:29:59"} +{"current_steps": 5659, "total_steps": 7063, "loss": 0.0031, "reward": -0.0922, "learning_rate": 9.854530597496953e-07, "epoch": 0.8, "percentage": 80.12, "elapsed_time": "1 day, 10:00:58", "remaining_time": "8:26:21"} +{"current_steps": 5669, "total_steps": 7063, "loss": 0.0025, "reward": -0.2618, "learning_rate": 1.039106611950943e-06, "epoch": 0.8, "percentage": 80.26, "elapsed_time": "1 day, 10:04:45", "remaining_time": "8:22:48"} +{"current_steps": 5679, "total_steps": 7063, "loss": 0.003, "reward": -0.1229, "learning_rate": 1.0940135940419828e-06, "epoch": 0.8, "percentage": 80.4, "elapsed_time": "1 day, 10:08:19", "remaining_time": "8:19:11"} +{"current_steps": 5689, "total_steps": 7063, "loss": 0.0029, "reward": -0.0647, "learning_rate": 1.1501566306365758e-06, "epoch": 0.81, "percentage": 80.55, "elapsed_time": "1 day, 10:12:08", "remaining_time": "8:15:37"} +{"current_steps": 5699, "total_steps": 7063, "loss": 0.003, "reward": -0.1913, "learning_rate": 1.2075179551973986e-06, "epoch": 0.81, "percentage": 80.69, "elapsed_time": "1 day, 10:15:48", "remaining_time": "8:12:02"} +{"current_steps": 5709, "total_steps": 7063, "loss": 0.0028, "reward": -0.1541, "learning_rate": 1.2660794156583233e-06, "epoch": 0.81, "percentage": 80.83, "elapsed_time": "1 day, 10:19:21", "remaining_time": "8:08:24"} +{"current_steps": 5719, "total_steps": 7063, "loss": 0.0033, "reward": -0.1554, "learning_rate": 1.3258224801686503e-06, "epoch": 0.81, "percentage": 80.97, "elapsed_time": "1 day, 10:22:44", "remaining_time": "8:04:45"} +{"current_steps": 5729, "total_steps": 7063, "loss": 0.0041, "reward": -0.3137, "learning_rate": 1.3867282429575152e-06, "epoch": 0.81, "percentage": 81.11, "elapsed_time": "1 day, 10:26:21", "remaining_time": "8:01:09"} +{"current_steps": 5739, "total_steps": 7063, "loss": 0.0033, "reward": -0.2465, "learning_rate": 1.4487774303166875e-06, "epoch": 0.81, "percentage": 81.25, "elapsed_time": "1 day, 10:30:06", "remaining_time": "7:57:34"} +{"current_steps": 5749, "total_steps": 7063, "loss": 0.0038, "reward": -0.2697, "learning_rate": 1.511950406699712e-06, "epoch": 0.81, "percentage": 81.4, "elapsed_time": "1 day, 10:33:40", "remaining_time": "7:53:57"} +{"current_steps": 5759, "total_steps": 7063, "loss": 0.0032, "reward": -0.155, "learning_rate": 1.576227180935655e-06, "epoch": 0.82, "percentage": 81.54, "elapsed_time": "1 day, 10:37:15", "remaining_time": "7:50:20"} +{"current_steps": 5769, "total_steps": 7063, "loss": 0.0026, "reward": -0.128, "learning_rate": 1.641587412555281e-06, "epoch": 0.82, "percentage": 81.68, "elapsed_time": "1 day, 10:40:55", "remaining_time": "7:46:45"} +{"current_steps": 5779, "total_steps": 7063, "loss": 0.0036, "reward": -0.1322, "learning_rate": 1.7080104182278716e-06, "epoch": 0.82, "percentage": 81.82, "elapsed_time": "1 day, 10:44:27", "remaining_time": "7:43:08"} +{"current_steps": 5789, "total_steps": 7063, "loss": 0.0036, "reward": -0.2405, "learning_rate": 1.7754751783064622e-06, "epoch": 0.82, "percentage": 81.96, "elapsed_time": "1 day, 10:47:59", "remaining_time": "7:39:30"} +{"current_steps": 5799, "total_steps": 7063, "loss": 0.0032, "reward": -0.1742, "learning_rate": 1.8439603434795516e-06, "epoch": 0.82, "percentage": 82.1, "elapsed_time": "1 day, 10:51:28", "remaining_time": "7:35:52"} +{"current_steps": 5809, "total_steps": 7063, "loss": 0.003, "reward": -0.1415, "learning_rate": 1.9134442415270926e-06, "epoch": 0.82, "percentage": 82.25, "elapsed_time": "1 day, 10:55:00", "remaining_time": "7:32:15"} +{"current_steps": 5819, "total_steps": 7063, "loss": 0.0027, "reward": -0.3485, "learning_rate": 1.983904884178742e-06, "epoch": 0.82, "percentage": 82.39, "elapsed_time": "1 day, 10:58:48", "remaining_time": "7:28:41"} +{"current_steps": 5829, "total_steps": 7063, "loss": 0.0033, "reward": -0.2301, "learning_rate": 2.0553199740720214e-06, "epoch": 0.83, "percentage": 82.53, "elapsed_time": "1 day, 11:02:19", "remaining_time": "7:25:03"} +{"current_steps": 5839, "total_steps": 7063, "loss": 0.0038, "reward": -0.419, "learning_rate": 2.1276669118084043e-06, "epoch": 0.83, "percentage": 82.67, "elapsed_time": "1 day, 11:05:55", "remaining_time": "7:21:27"} +{"current_steps": 5849, "total_steps": 7063, "loss": 0.0028, "reward": -0.1832, "learning_rate": 2.200922803104868e-06, "epoch": 0.83, "percentage": 82.81, "elapsed_time": "1 day, 11:09:24", "remaining_time": "7:17:49"} +{"current_steps": 5859, "total_steps": 7063, "loss": 0.0028, "reward": -0.1299, "learning_rate": 2.2750644660388675e-06, "epoch": 0.83, "percentage": 82.95, "elapsed_time": "1 day, 11:12:56", "remaining_time": "7:14:12"} +{"current_steps": 5869, "total_steps": 7063, "loss": 0.0027, "reward": -0.0986, "learning_rate": 2.3500684383842605e-06, "epoch": 0.83, "percentage": 83.1, "elapsed_time": "1 day, 11:16:39", "remaining_time": "7:10:37"} +{"current_steps": 5879, "total_steps": 7063, "loss": 0.0027, "reward": -0.1309, "learning_rate": 2.4259109850359695e-06, "epoch": 0.83, "percentage": 83.24, "elapsed_time": "1 day, 11:20:15", "remaining_time": "7:07:00"} +{"current_steps": 5889, "total_steps": 7063, "loss": 0.0034, "reward": -0.1672, "learning_rate": 2.502568105520961e-06, "epoch": 0.83, "percentage": 83.38, "elapsed_time": "1 day, 11:23:55", "remaining_time": "7:03:24"} +{"current_steps": 5899, "total_steps": 7063, "loss": 0.0031, "reward": -0.1751, "learning_rate": 2.580015541593277e-06, "epoch": 0.84, "percentage": 83.52, "elapsed_time": "1 day, 11:27:35", "remaining_time": "6:59:49"} +{"current_steps": 5909, "total_steps": 7063, "loss": 0.0031, "reward": -0.2151, "learning_rate": 2.6582287849105274e-06, "epoch": 0.84, "percentage": 83.66, "elapsed_time": "1 day, 11:31:11", "remaining_time": "6:56:12"} +{"current_steps": 5919, "total_steps": 7063, "loss": 0.0029, "reward": -0.1455, "learning_rate": 2.737183084789651e-06, "epoch": 0.84, "percentage": 83.8, "elapsed_time": "1 day, 11:34:56", "remaining_time": "6:52:38"} +{"current_steps": 5929, "total_steps": 7063, "loss": 0.0026, "reward": -0.1059, "learning_rate": 2.816853456039244e-06, "epoch": 0.84, "percentage": 83.94, "elapsed_time": "1 day, 11:38:43", "remaining_time": "6:49:03"} +{"current_steps": 5939, "total_steps": 7063, "loss": 0.0028, "reward": -0.1925, "learning_rate": 2.8972146868661828e-06, "epoch": 0.84, "percentage": 84.09, "elapsed_time": "1 day, 11:42:19", "remaining_time": "6:45:27"} +{"current_steps": 5949, "total_steps": 7063, "loss": 0.0028, "reward": -0.3239, "learning_rate": 2.9782413468539417e-06, "epoch": 0.84, "percentage": 84.23, "elapsed_time": "1 day, 11:45:53", "remaining_time": "6:41:50"} +{"current_steps": 5959, "total_steps": 7063, "loss": 0.0039, "reward": -0.2807, "learning_rate": 3.0599077950100608e-06, "epoch": 0.84, "percentage": 84.37, "elapsed_time": "1 day, 11:49:21", "remaining_time": "6:38:12"} +{"current_steps": 5969, "total_steps": 7063, "loss": 0.0028, "reward": -0.2573, "learning_rate": 3.1421881878802864e-06, "epoch": 0.85, "percentage": 84.51, "elapsed_time": "1 day, 11:52:53", "remaining_time": "6:34:35"} +{"current_steps": 5979, "total_steps": 7063, "loss": 0.003, "reward": -0.2115, "learning_rate": 3.225056487726732e-06, "epoch": 0.85, "percentage": 84.65, "elapsed_time": "1 day, 11:56:38", "remaining_time": "6:31:00"} +{"current_steps": 5989, "total_steps": 7063, "loss": 0.0028, "reward": -0.1847, "learning_rate": 3.308486470767613e-06, "epoch": 0.85, "percentage": 84.79, "elapsed_time": "1 day, 12:00:14", "remaining_time": "6:27:23"} +{"current_steps": 5999, "total_steps": 7063, "loss": 0.0027, "reward": -0.1512, "learning_rate": 3.3924517354757315e-06, "epoch": 0.85, "percentage": 84.94, "elapsed_time": "1 day, 12:03:53", "remaining_time": "6:23:47"} +{"current_steps": 6009, "total_steps": 7063, "loss": 0.0031, "reward": -0.0941, "learning_rate": 3.476925710933339e-06, "epoch": 0.85, "percentage": 85.08, "elapsed_time": "1 day, 12:07:24", "remaining_time": "6:20:10"} +{"current_steps": 6019, "total_steps": 7063, "loss": 0.0033, "reward": -0.2708, "learning_rate": 3.5618816652404714e-06, "epoch": 0.85, "percentage": 85.22, "elapsed_time": "1 day, 12:10:52", "remaining_time": "6:16:32"} +{"current_steps": 6029, "total_steps": 7063, "loss": 0.0024, "reward": -0.1351, "learning_rate": 3.6472927139743546e-06, "epoch": 0.85, "percentage": 85.36, "elapsed_time": "1 day, 12:14:35", "remaining_time": "6:12:57"} +{"current_steps": 6039, "total_steps": 7063, "loss": 0.003, "reward": -0.2288, "learning_rate": 3.7331318286969787e-06, "epoch": 0.86, "percentage": 85.5, "elapsed_time": "1 day, 12:18:08", "remaining_time": "6:09:20"} +{"current_steps": 6049, "total_steps": 7063, "loss": 0.0025, "reward": -0.1268, "learning_rate": 3.819371845508301e-06, "epoch": 0.86, "percentage": 85.64, "elapsed_time": "1 day, 12:21:49", "remaining_time": "6:05:44"} +{"current_steps": 6059, "total_steps": 7063, "loss": 0.0035, "reward": -0.1775, "learning_rate": 3.9059854736422616e-06, "epoch": 0.86, "percentage": 85.79, "elapsed_time": "1 day, 12:25:12", "remaining_time": "6:02:05"} +{"current_steps": 6069, "total_steps": 7063, "loss": 0.0029, "reward": -0.1164, "learning_rate": 3.992945304103046e-06, "epoch": 0.86, "percentage": 85.93, "elapsed_time": "1 day, 12:28:50", "remaining_time": "5:58:29"} +{"current_steps": 6079, "total_steps": 7063, "loss": 0.003, "reward": -0.3306, "learning_rate": 4.080223818338627e-06, "epoch": 0.86, "percentage": 86.07, "elapsed_time": "1 day, 12:32:23", "remaining_time": "5:54:52"} +{"current_steps": 6089, "total_steps": 7063, "loss": 0.0029, "reward": -0.124, "learning_rate": 4.16779339694911e-06, "epoch": 0.86, "percentage": 86.21, "elapsed_time": "1 day, 12:36:03", "remaining_time": "5:51:16"} +{"current_steps": 6099, "total_steps": 7063, "loss": 0.0029, "reward": -0.1823, "learning_rate": 4.25562632842687e-06, "epoch": 0.86, "percentage": 86.35, "elapsed_time": "1 day, 12:39:40", "remaining_time": "5:47:40"} +{"current_steps": 6109, "total_steps": 7063, "loss": 0.0026, "reward": -0.2144, "learning_rate": 4.343694817925945e-06, "epoch": 0.86, "percentage": 86.49, "elapsed_time": "1 day, 12:43:14", "remaining_time": "5:44:03"} +{"current_steps": 6119, "total_steps": 7063, "loss": 0.0028, "reward": -0.0664, "learning_rate": 4.4319709960577205e-06, "epoch": 0.87, "percentage": 86.63, "elapsed_time": "1 day, 12:46:53", "remaining_time": "5:40:27"} +{"current_steps": 6129, "total_steps": 7063, "loss": 0.0027, "reward": -0.1177, "learning_rate": 4.520426927710255e-06, "epoch": 0.87, "percentage": 86.78, "elapsed_time": "1 day, 12:50:27", "remaining_time": "5:36:51"} +{"current_steps": 6139, "total_steps": 7063, "loss": 0.0034, "reward": -0.135, "learning_rate": 4.609034620888349e-06, "epoch": 0.87, "percentage": 86.92, "elapsed_time": "1 day, 12:53:54", "remaining_time": "5:33:13"} +{"current_steps": 6149, "total_steps": 7063, "loss": 0.0043, "reward": -0.3131, "learning_rate": 4.697766035571671e-06, "epoch": 0.87, "percentage": 87.06, "elapsed_time": "1 day, 12:57:30", "remaining_time": "5:29:36"} +{"current_steps": 6159, "total_steps": 7063, "loss": 0.0024, "reward": -0.234, "learning_rate": 4.786593092588086e-06, "epoch": 0.87, "percentage": 87.2, "elapsed_time": "1 day, 13:01:13", "remaining_time": "5:26:01"} +{"current_steps": 6169, "total_steps": 7063, "loss": 0.0027, "reward": -0.0573, "learning_rate": 4.875487682499278e-06, "epoch": 0.87, "percentage": 87.34, "elapsed_time": "1 day, 13:04:47", "remaining_time": "5:22:24"} +{"current_steps": 6179, "total_steps": 7063, "loss": 0.0034, "reward": -0.1771, "learning_rate": 4.96442167449609e-06, "epoch": 0.87, "percentage": 87.48, "elapsed_time": "1 day, 13:08:23", "remaining_time": "5:18:48"} +{"current_steps": 6189, "total_steps": 7063, "loss": 0.0028, "reward": -0.1481, "learning_rate": 5.053366925300511e-06, "epoch": 0.88, "percentage": 87.63, "elapsed_time": "1 day, 13:11:58", "remaining_time": "5:15:11"} +{"current_steps": 6199, "total_steps": 7063, "loss": 0.0041, "reward": -0.2635, "learning_rate": 5.142295288071675e-06, "epoch": 0.88, "percentage": 87.77, "elapsed_time": "1 day, 13:15:33", "remaining_time": "5:11:35"} +{"current_steps": 6209, "total_steps": 7063, "loss": 0.003, "reward": -0.1914, "learning_rate": 5.2311786213129315e-06, "epoch": 0.88, "percentage": 87.91, "elapsed_time": "1 day, 13:19:07", "remaining_time": "5:07:58"} +{"current_steps": 6219, "total_steps": 7063, "loss": 0.0027, "reward": -0.181, "learning_rate": 5.319988797777316e-06, "epoch": 0.88, "percentage": 88.05, "elapsed_time": "1 day, 13:22:43", "remaining_time": "5:04:22"} +{"current_steps": 6229, "total_steps": 7063, "loss": 0.0028, "reward": -0.1659, "learning_rate": 5.408697713368388e-06, "epoch": 0.88, "percentage": 88.19, "elapsed_time": "1 day, 13:26:29", "remaining_time": "5:00:46"} +{"current_steps": 6239, "total_steps": 7063, "loss": 0.0024, "reward": -0.0837, "learning_rate": 5.4972772960338784e-06, "epoch": 0.88, "percentage": 88.33, "elapsed_time": "1 day, 13:30:08", "remaining_time": "4:57:10"} +{"current_steps": 6249, "total_steps": 7063, "loss": 0.003, "reward": -0.1156, "learning_rate": 5.585699514649057e-06, "epoch": 0.88, "percentage": 88.48, "elapsed_time": "1 day, 13:33:51", "remaining_time": "4:53:35"} +{"current_steps": 6259, "total_steps": 7063, "loss": 0.003, "reward": -0.1918, "learning_rate": 5.6739363878872754e-06, "epoch": 0.89, "percentage": 88.62, "elapsed_time": "1 day, 13:37:31", "remaining_time": "4:49:59"} +{"current_steps": 6269, "total_steps": 7063, "loss": 0.0027, "reward": -0.2119, "learning_rate": 5.761959993074669e-06, "epoch": 0.89, "percentage": 88.76, "elapsed_time": "1 day, 13:41:02", "remaining_time": "4:46:22"} +{"current_steps": 6279, "total_steps": 7063, "loss": 0.0031, "reward": -0.1654, "learning_rate": 5.84974247502633e-06, "epoch": 0.89, "percentage": 88.9, "elapsed_time": "1 day, 13:44:46", "remaining_time": "4:42:46"} +{"current_steps": 6289, "total_steps": 7063, "loss": 0.0029, "reward": -0.1048, "learning_rate": 5.93725605486109e-06, "epoch": 0.89, "percentage": 89.04, "elapsed_time": "1 day, 13:48:23", "remaining_time": "4:39:10"} +{"current_steps": 6299, "total_steps": 7063, "loss": 0.0029, "reward": -0.1743, "learning_rate": 6.024473038792242e-06, "epoch": 0.89, "percentage": 89.18, "elapsed_time": "1 day, 13:51:58", "remaining_time": "4:35:33"} +{"current_steps": 6309, "total_steps": 7063, "loss": 0.0028, "reward": -0.1883, "learning_rate": 6.1113658268912065e-06, "epoch": 0.89, "percentage": 89.32, "elapsed_time": "1 day, 13:55:35", "remaining_time": "4:31:57"} +{"current_steps": 6319, "total_steps": 7063, "loss": 0.0027, "reward": -0.1351, "learning_rate": 6.197906921821632e-06, "epoch": 0.89, "percentage": 89.47, "elapsed_time": "1 day, 13:59:19", "remaining_time": "4:28:22"} +{"current_steps": 6329, "total_steps": 7063, "loss": 0.0027, "reward": -0.1687, "learning_rate": 6.284068937540894e-06, "epoch": 0.9, "percentage": 89.61, "elapsed_time": "1 day, 14:02:56", "remaining_time": "4:24:45"} +{"current_steps": 6339, "total_steps": 7063, "loss": 0.0028, "reward": -0.1027, "learning_rate": 6.369824607966508e-06, "epoch": 0.9, "percentage": 89.75, "elapsed_time": "1 day, 14:06:35", "remaining_time": "4:21:09"} +{"current_steps": 6349, "total_steps": 7063, "loss": 0.0028, "reward": -0.0773, "learning_rate": 6.455146795604479e-06, "epoch": 0.9, "percentage": 89.89, "elapsed_time": "1 day, 14:10:03", "remaining_time": "4:17:32"} +{"current_steps": 6359, "total_steps": 7063, "loss": 0.0025, "reward": -0.2412, "learning_rate": 6.5400085001370186e-06, "epoch": 0.9, "percentage": 90.03, "elapsed_time": "1 day, 14:13:52", "remaining_time": "4:13:57"} +{"current_steps": 6369, "total_steps": 7063, "loss": 0.003, "reward": -0.1633, "learning_rate": 6.624382866966794e-06, "epoch": 0.9, "percentage": 90.17, "elapsed_time": "1 day, 14:17:25", "remaining_time": "4:10:20"} +{"current_steps": 6379, "total_steps": 7063, "loss": 0.0026, "reward": -0.2322, "learning_rate": 6.708243195715136e-06, "epoch": 0.9, "percentage": 90.32, "elapsed_time": "1 day, 14:21:00", "remaining_time": "4:06:43"} +{"current_steps": 6389, "total_steps": 7063, "loss": 0.0032, "reward": -0.1261, "learning_rate": 6.791562948671414e-06, "epoch": 0.9, "percentage": 90.46, "elapsed_time": "1 day, 14:24:39", "remaining_time": "4:03:07"} +{"current_steps": 6399, "total_steps": 7063, "loss": 0.0025, "reward": -0.1441, "learning_rate": 6.874315759190886e-06, "epoch": 0.91, "percentage": 90.6, "elapsed_time": "1 day, 14:28:19", "remaining_time": "3:59:31"} +{"current_steps": 6409, "total_steps": 7063, "loss": 0.0031, "reward": -0.0489, "learning_rate": 6.956475440038507e-06, "epoch": 0.91, "percentage": 90.74, "elapsed_time": "1 day, 14:31:53", "remaining_time": "3:55:54"} +{"current_steps": 6419, "total_steps": 7063, "loss": 0.0028, "reward": -0.1033, "learning_rate": 7.038015991675885e-06, "epoch": 0.91, "percentage": 90.88, "elapsed_time": "1 day, 14:35:26", "remaining_time": "3:52:18"} +{"current_steps": 6429, "total_steps": 7063, "loss": 0.0027, "reward": -0.2106, "learning_rate": 7.118911610488885e-06, "epoch": 0.91, "percentage": 91.02, "elapsed_time": "1 day, 14:39:06", "remaining_time": "3:48:42"} +{"current_steps": 6439, "total_steps": 7063, "loss": 0.0036, "reward": -0.0478, "learning_rate": 7.199136696953178e-06, "epoch": 0.91, "percentage": 91.17, "elapsed_time": "1 day, 14:42:44", "remaining_time": "3:45:05"} +{"current_steps": 6449, "total_steps": 7063, "loss": 0.003, "reward": -0.218, "learning_rate": 7.2786658637353125e-06, "epoch": 0.91, "percentage": 91.31, "elapsed_time": "1 day, 14:46:16", "remaining_time": "3:41:28"} +{"current_steps": 6459, "total_steps": 7063, "loss": 0.0026, "reward": -0.0883, "learning_rate": 7.357473943726493e-06, "epoch": 0.91, "percentage": 91.45, "elapsed_time": "1 day, 14:49:57", "remaining_time": "3:37:52"} +{"current_steps": 6469, "total_steps": 7063, "loss": 0.0034, "reward": -0.2207, "learning_rate": 7.435535998006814e-06, "epoch": 0.92, "percentage": 91.59, "elapsed_time": "1 day, 14:53:29", "remaining_time": "3:34:16"} +{"current_steps": 6479, "total_steps": 7063, "loss": 0.0033, "reward": -0.192, "learning_rate": 7.512827323737152e-06, "epoch": 0.92, "percentage": 91.73, "elapsed_time": "1 day, 14:57:05", "remaining_time": "3:30:39"} +{"current_steps": 6489, "total_steps": 7063, "loss": 0.0028, "reward": -0.1123, "learning_rate": 7.589323461976461e-06, "epoch": 0.92, "percentage": 91.87, "elapsed_time": "1 day, 15:00:44", "remaining_time": "3:27:03"} +{"current_steps": 6499, "total_steps": 7063, "loss": 0.0029, "reward": -0.2671, "learning_rate": 7.665000205421812e-06, "epoch": 0.92, "percentage": 92.01, "elapsed_time": "1 day, 15:04:25", "remaining_time": "3:23:27"} +{"current_steps": 6509, "total_steps": 7063, "loss": 0.0031, "reward": -0.1165, "learning_rate": 7.739833606068832e-06, "epoch": 0.92, "percentage": 92.16, "elapsed_time": "1 day, 15:08:04", "remaining_time": "3:19:51"} +{"current_steps": 6519, "total_steps": 7063, "loss": 0.0029, "reward": -0.1378, "learning_rate": 7.81379998279006e-06, "epoch": 0.92, "percentage": 92.3, "elapsed_time": "1 day, 15:11:44", "remaining_time": "3:16:14"} +{"current_steps": 6529, "total_steps": 7063, "loss": 0.0033, "reward": -0.1337, "learning_rate": 7.88687592882892e-06, "epoch": 0.92, "percentage": 92.44, "elapsed_time": "1 day, 15:15:10", "remaining_time": "3:12:37"} +{"current_steps": 6539, "total_steps": 7063, "loss": 0.0027, "reward": -0.2007, "learning_rate": 7.959038319206758e-06, "epoch": 0.93, "percentage": 92.58, "elapsed_time": "1 day, 15:18:48", "remaining_time": "3:09:01"} +{"current_steps": 6549, "total_steps": 7063, "loss": 0.0026, "reward": -0.1243, "learning_rate": 8.03026431804083e-06, "epoch": 0.93, "percentage": 92.72, "elapsed_time": "1 day, 15:22:25", "remaining_time": "3:05:24"} +{"current_steps": 6559, "total_steps": 7063, "loss": 0.0029, "reward": -0.0918, "learning_rate": 8.100531385770696e-06, "epoch": 0.93, "percentage": 92.86, "elapsed_time": "1 day, 15:26:05", "remaining_time": "3:01:48"} +{"current_steps": 6569, "total_steps": 7063, "loss": 0.0029, "reward": -0.0355, "learning_rate": 8.169817286290935e-06, "epoch": 0.93, "percentage": 93.01, "elapsed_time": "1 day, 15:29:48", "remaining_time": "2:58:12"} +{"current_steps": 6579, "total_steps": 7063, "loss": 0.0027, "reward": -0.2479, "learning_rate": 8.238100093987765e-06, "epoch": 0.93, "percentage": 93.15, "elapsed_time": "1 day, 15:33:31", "remaining_time": "2:54:36"} +{"current_steps": 6589, "total_steps": 7063, "loss": 0.0026, "reward": -0.074, "learning_rate": 8.305358200677449e-06, "epoch": 0.93, "percentage": 93.29, "elapsed_time": "1 day, 15:37:13", "remaining_time": "2:51:00"} +{"current_steps": 6599, "total_steps": 7063, "loss": 0.0029, "reward": -0.0884, "learning_rate": 8.371570322444209e-06, "epoch": 0.93, "percentage": 93.43, "elapsed_time": "1 day, 15:40:52", "remaining_time": "2:47:24"} +{"current_steps": 6609, "total_steps": 7063, "loss": 0.0028, "reward": -0.1674, "learning_rate": 8.436715506375557e-06, "epoch": 0.94, "percentage": 93.57, "elapsed_time": "1 day, 15:44:26", "remaining_time": "2:43:47"} +{"current_steps": 6619, "total_steps": 7063, "loss": 0.0035, "reward": -0.2794, "learning_rate": 8.500773137192906e-06, "epoch": 0.94, "percentage": 93.71, "elapsed_time": "1 day, 15:47:59", "remaining_time": "2:40:11"} +{"current_steps": 6629, "total_steps": 7063, "loss": 0.0027, "reward": -0.1072, "learning_rate": 8.56372294377524e-06, "epoch": 0.94, "percentage": 93.86, "elapsed_time": "1 day, 15:51:37", "remaining_time": "2:36:34"} +{"current_steps": 6639, "total_steps": 7063, "loss": 0.0023, "reward": -0.0992, "learning_rate": 8.625545005574002e-06, "epoch": 0.94, "percentage": 94.0, "elapsed_time": "1 day, 15:55:17", "remaining_time": "2:32:58"} +{"current_steps": 6649, "total_steps": 7063, "loss": 0.0029, "reward": -0.1256, "learning_rate": 8.686219758916918e-06, "epoch": 0.94, "percentage": 94.14, "elapsed_time": "1 day, 15:58:49", "remaining_time": "2:29:21"} +{"current_steps": 6659, "total_steps": 7063, "loss": 0.0039, "reward": 0.0413, "learning_rate": 8.745728003198991e-06, "epoch": 0.94, "percentage": 94.28, "elapsed_time": "1 day, 16:02:22", "remaining_time": "2:25:45"} +{"current_steps": 6669, "total_steps": 7063, "loss": 0.0026, "reward": -0.1593, "learning_rate": 8.804050906958537e-06, "epoch": 0.94, "percentage": 94.42, "elapsed_time": "1 day, 16:05:56", "remaining_time": "2:22:08"} +{"current_steps": 6679, "total_steps": 7063, "loss": 0.0031, "reward": -0.0352, "learning_rate": 8.861170013836436e-06, "epoch": 0.95, "percentage": 94.56, "elapsed_time": "1 day, 16:09:29", "remaining_time": "2:18:31"} +{"current_steps": 6689, "total_steps": 7063, "loss": 0.003, "reward": -0.0722, "learning_rate": 8.917067248416647e-06, "epoch": 0.95, "percentage": 94.7, "elapsed_time": "1 day, 16:13:04", "remaining_time": "2:14:55"} +{"current_steps": 6699, "total_steps": 7063, "loss": 0.0027, "reward": -0.1898, "learning_rate": 8.971724921946235e-06, "epoch": 0.95, "percentage": 94.85, "elapsed_time": "1 day, 16:16:38", "remaining_time": "2:11:18"} +{"current_steps": 6709, "total_steps": 7063, "loss": 0.003, "reward": -0.1166, "learning_rate": 9.025125737932962e-06, "epoch": 0.95, "percentage": 94.99, "elapsed_time": "1 day, 16:20:12", "remaining_time": "2:07:42"} +{"current_steps": 6719, "total_steps": 7063, "loss": 0.0024, "reward": 0.0003, "learning_rate": 9.077252797618818e-06, "epoch": 0.95, "percentage": 95.13, "elapsed_time": "1 day, 16:23:47", "remaining_time": "2:04:05"} +{"current_steps": 6729, "total_steps": 7063, "loss": 0.0028, "reward": -0.0084, "learning_rate": 9.128089605327627e-06, "epoch": 0.95, "percentage": 95.27, "elapsed_time": "1 day, 16:27:22", "remaining_time": "2:00:29"} +{"current_steps": 6739, "total_steps": 7063, "loss": 0.0025, "reward": 0.0006, "learning_rate": 9.177620073685139e-06, "epoch": 0.95, "percentage": 95.41, "elapsed_time": "1 day, 16:30:57", "remaining_time": "1:56:52"} +{"current_steps": 6749, "total_steps": 7063, "loss": 0.0025, "reward": -0.0565, "learning_rate": 9.225828528709911e-06, "epoch": 0.96, "percentage": 95.55, "elapsed_time": "1 day, 16:34:41", "remaining_time": "1:53:16"} +{"current_steps": 6759, "total_steps": 7063, "loss": 0.0027, "reward": -0.2262, "learning_rate": 9.27269971477334e-06, "epoch": 0.96, "percentage": 95.7, "elapsed_time": "1 day, 16:38:15", "remaining_time": "1:49:39"} +{"current_steps": 6769, "total_steps": 7063, "loss": 0.0024, "reward": -0.2918, "learning_rate": 9.318218799427321e-06, "epoch": 0.96, "percentage": 95.84, "elapsed_time": "1 day, 16:41:52", "remaining_time": "1:46:03"} +{"current_steps": 6779, "total_steps": 7063, "loss": 0.0027, "reward": -0.1157, "learning_rate": 9.362371378098033e-06, "epoch": 0.96, "percentage": 95.98, "elapsed_time": "1 day, 16:45:31", "remaining_time": "1:42:27"} +{"current_steps": 6789, "total_steps": 7063, "loss": 0.0031, "reward": -0.1187, "learning_rate": 9.405143478644232e-06, "epoch": 0.96, "percentage": 96.12, "elapsed_time": "1 day, 16:49:05", "remaining_time": "1:38:50"} +{"current_steps": 6799, "total_steps": 7063, "loss": 0.0028, "reward": -0.0971, "learning_rate": 9.446521565778804e-06, "epoch": 0.96, "percentage": 96.26, "elapsed_time": "1 day, 16:52:40", "remaining_time": "1:35:14"} +{"current_steps": 6809, "total_steps": 7063, "loss": 0.0029, "reward": -0.0164, "learning_rate": 9.486492545351985e-06, "epoch": 0.96, "percentage": 96.4, "elapsed_time": "1 day, 16:56:15", "remaining_time": "1:31:37"} +{"current_steps": 6819, "total_steps": 7063, "loss": 0.0029, "reward": -0.2, "learning_rate": 9.525043768495047e-06, "epoch": 0.97, "percentage": 96.55, "elapsed_time": "1 day, 16:59:51", "remaining_time": "1:28:01"} +{"current_steps": 6829, "total_steps": 7063, "loss": 0.0022, "reward": 0.0569, "learning_rate": 9.562163035623038e-06, "epoch": 0.97, "percentage": 96.69, "elapsed_time": "1 day, 17:03:36", "remaining_time": "1:24:25"} +{"current_steps": 6839, "total_steps": 7063, "loss": 0.0023, "reward": -0.163, "learning_rate": 9.597838600295355e-06, "epoch": 0.97, "percentage": 96.83, "elapsed_time": "1 day, 17:07:16", "remaining_time": "1:20:48"} +{"current_steps": 6849, "total_steps": 7063, "loss": 0.0027, "reward": -0.1407, "learning_rate": 9.632059172932935e-06, "epoch": 0.97, "percentage": 96.97, "elapsed_time": "1 day, 17:10:54", "remaining_time": "1:17:12"} +{"current_steps": 6859, "total_steps": 7063, "loss": 0.0026, "reward": -0.1893, "learning_rate": 9.664813924390828e-06, "epoch": 0.97, "percentage": 97.11, "elapsed_time": "1 day, 17:14:31", "remaining_time": "1:13:35"} +{"current_steps": 6869, "total_steps": 7063, "loss": 0.0027, "reward": -0.0518, "learning_rate": 9.696092489385132e-06, "epoch": 0.97, "percentage": 97.25, "elapsed_time": "1 day, 17:18:03", "remaining_time": "1:09:59"} +{"current_steps": 6879, "total_steps": 7063, "loss": 0.0026, "reward": -0.1236, "learning_rate": 9.72588496977306e-06, "epoch": 0.97, "percentage": 97.39, "elapsed_time": "1 day, 17:21:36", "remaining_time": "1:06:22"} +{"current_steps": 6889, "total_steps": 7063, "loss": 0.0026, "reward": -0.2622, "learning_rate": 9.754181937685261e-06, "epoch": 0.98, "percentage": 97.54, "elapsed_time": "1 day, 17:25:09", "remaining_time": "1:02:46"} +{"current_steps": 6899, "total_steps": 7063, "loss": 0.0025, "reward": -0.1576, "learning_rate": 9.780974438509254e-06, "epoch": 0.98, "percentage": 97.68, "elapsed_time": "1 day, 17:28:48", "remaining_time": "0:59:09"} +{"current_steps": 6909, "total_steps": 7063, "loss": 0.0036, "reward": -0.0548, "learning_rate": 9.80625399372313e-06, "epoch": 0.98, "percentage": 97.82, "elapsed_time": "1 day, 17:32:15", "remaining_time": "0:55:33"} +{"current_steps": 6919, "total_steps": 7063, "loss": 0.0037, "reward": -0.219, "learning_rate": 9.8300126035786e-06, "epoch": 0.98, "percentage": 97.96, "elapsed_time": "1 day, 17:35:51", "remaining_time": "0:51:56"} +{"current_steps": 6929, "total_steps": 7063, "loss": 0.0028, "reward": -0.0597, "learning_rate": 9.852242749632524e-06, "epoch": 0.98, "percentage": 98.1, "elapsed_time": "1 day, 17:39:23", "remaining_time": "0:48:20"} +{"current_steps": 6939, "total_steps": 7063, "loss": 0.0024, "reward": -0.133, "learning_rate": 9.872937397126121e-06, "epoch": 0.98, "percentage": 98.24, "elapsed_time": "1 day, 17:43:02", "remaining_time": "0:44:43"} +{"current_steps": 6949, "total_steps": 7063, "loss": 0.0027, "reward": -0.0708, "learning_rate": 9.89208999721115e-06, "epoch": 0.98, "percentage": 98.39, "elapsed_time": "1 day, 17:46:38", "remaining_time": "0:41:07"} +{"current_steps": 6959, "total_steps": 7063, "loss": 0.0026, "reward": -0.0812, "learning_rate": 9.909694489022273e-06, "epoch": 0.99, "percentage": 98.53, "elapsed_time": "1 day, 17:50:14", "remaining_time": "0:37:30"} +{"current_steps": 6969, "total_steps": 7063, "loss": 0.0031, "reward": 0.0002, "learning_rate": 9.92574530159505e-06, "epoch": 0.99, "percentage": 98.67, "elapsed_time": "1 day, 17:53:50", "remaining_time": "0:33:54"} +{"current_steps": 6979, "total_steps": 7063, "loss": 0.003, "reward": 0.0289, "learning_rate": 9.940237355628861e-06, "epoch": 0.99, "percentage": 98.81, "elapsed_time": "1 day, 17:57:23", "remaining_time": "0:30:17"} +{"current_steps": 6989, "total_steps": 7063, "loss": 0.0029, "reward": -0.0353, "learning_rate": 9.95316606509427e-06, "epoch": 0.99, "percentage": 98.95, "elapsed_time": "1 day, 18:01:05", "remaining_time": "0:26:41"} +{"current_steps": 6999, "total_steps": 7063, "loss": 0.0023, "reward": -0.0618, "learning_rate": 9.964527338684262e-06, "epoch": 0.99, "percentage": 99.09, "elapsed_time": "1 day, 18:04:56", "remaining_time": "0:23:05"} +{"current_steps": 7009, "total_steps": 7063, "loss": 0.003, "reward": -0.1512, "learning_rate": 9.974317581108963e-06, "epoch": 0.99, "percentage": 99.24, "elapsed_time": "1 day, 18:08:26", "remaining_time": "0:19:28"} +{"current_steps": 7019, "total_steps": 7063, "loss": 0.0032, "reward": 0.0394, "learning_rate": 9.98253369423336e-06, "epoch": 0.99, "percentage": 99.38, "elapsed_time": "1 day, 18:11:56", "remaining_time": "0:15:52"} +{"current_steps": 7029, "total_steps": 7063, "loss": 0.0027, "reward": -0.081, "learning_rate": 9.989173078057715e-06, "epoch": 1.0, "percentage": 99.52, "elapsed_time": "1 day, 18:15:35", "remaining_time": "0:12:15"} +{"current_steps": 7039, "total_steps": 7063, "loss": 0.0028, "reward": -0.0309, "learning_rate": 9.99423363154034e-06, "epoch": 1.0, "percentage": 99.66, "elapsed_time": "1 day, 18:19:23", "remaining_time": "0:08:39"} +{"current_steps": 7049, "total_steps": 7063, "loss": 0.0025, "reward": -0.1167, "learning_rate": 9.99771375326247e-06, "epoch": 1.0, "percentage": 99.8, "elapsed_time": "1 day, 18:22:59", "remaining_time": "0:05:03"} +{"current_steps": 7059, "total_steps": 7063, "loss": 0.0024, "reward": -0.0893, "learning_rate": 9.999612341935039e-06, "epoch": 1.0, "percentage": 99.94, "elapsed_time": "1 day, 18:26:47", "remaining_time": "0:01:26"} diff --git a/ppo-lora/trainer_state.json b/ppo-lora/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..a518402d6cc81bfb090faed292b6f1c33e356bb5 --- /dev/null +++ b/ppo-lora/trainer_state.json @@ -0,0 +1,4958 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": null, + "global_step": 0, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 9.999359182892298e-06, + "loss": 0.0058, + "reward": -0.5258, + "step": 9 + }, + { + "epoch": 0.0, + "learning_rate": 9.997144223525905e-06, + "loss": 0.0053, + "reward": -0.5235, + "step": 19 + }, + { + "epoch": 0.0, + "learning_rate": 9.993347911338379e-06, + "loss": 0.0063, + "reward": -0.5422, + "step": 29 + }, + { + "epoch": 0.01, + "learning_rate": 9.987971447677674e-06, + "loss": 0.0052, + "reward": -0.5766, + "step": 39 + }, + { + "epoch": 0.01, + "learning_rate": 9.981016533932741e-06, + "loss": 0.0042, + "reward": -0.3694, + "step": 49 + }, + { + "epoch": 0.01, + "learning_rate": 9.972485370995129e-06, + "loss": 0.004, + "reward": -0.346, + "step": 59 + }, + { + "epoch": 0.01, + "learning_rate": 9.962380658562499e-06, + "loss": 0.0047, + "reward": -0.4197, + "step": 69 + }, + { + "epoch": 0.01, + "learning_rate": 9.950705594284304e-06, + "loss": 0.0043, + "reward": -0.1848, + "step": 79 + }, + { + "epoch": 0.01, + "learning_rate": 9.937463872749902e-06, + "loss": 0.0046, + "reward": -0.4406, + "step": 89 + }, + { + "epoch": 0.01, + "learning_rate": 9.922659684319374e-06, + "loss": 0.0044, + "reward": -0.4997, + "step": 99 + }, + { + "epoch": 0.02, + "learning_rate": 9.906297713797501e-06, + "loss": 0.0048, + "reward": -0.4274, + "step": 109 + }, + { + "epoch": 0.02, + "learning_rate": 9.888383138951242e-06, + "loss": 0.0046, + "reward": -0.3451, + "step": 119 + }, + { + "epoch": 0.02, + "learning_rate": 9.868921628871223e-06, + "loss": 0.0051, + "reward": -0.4131, + "step": 129 + }, + { + "epoch": 0.02, + "learning_rate": 9.847919342177744e-06, + "loss": 0.004, + "reward": -0.2998, + "step": 139 + }, + { + "epoch": 0.02, + "learning_rate": 9.825382925071883e-06, + "loss": 0.0045, + "reward": -0.4068, + "step": 149 + }, + { + "epoch": 0.02, + "learning_rate": 9.801319509232287e-06, + "loss": 0.0051, + "reward": -0.4744, + "step": 159 + }, + { + "epoch": 0.02, + "learning_rate": 9.775736709558352e-06, + "loss": 0.0054, + "reward": -0.5511, + "step": 169 + }, + { + "epoch": 0.03, + "learning_rate": 9.748642621760474e-06, + "loss": 0.0055, + "reward": -0.2605, + "step": 179 + }, + { + "epoch": 0.03, + "learning_rate": 9.720045819798151e-06, + "loss": 0.0043, + "reward": -0.4817, + "step": 189 + }, + { + "epoch": 0.03, + "learning_rate": 9.68995535316674e-06, + "loss": 0.0061, + "reward": -0.3717, + "step": 199 + }, + { + "epoch": 0.03, + "learning_rate": 9.658380744033737e-06, + "loss": 0.0041, + "reward": -0.3632, + "step": 209 + }, + { + "epoch": 0.03, + "learning_rate": 9.625331984225475e-06, + "loss": 0.0039, + "reward": -0.4044, + "step": 219 + }, + { + "epoch": 0.03, + "learning_rate": 9.590819532065188e-06, + "loss": 0.0049, + "reward": -0.3763, + "step": 229 + }, + { + "epoch": 0.03, + "learning_rate": 9.554854309063474e-06, + "loss": 0.0053, + "reward": -0.3172, + "step": 239 + }, + { + "epoch": 0.04, + "learning_rate": 9.517447696462163e-06, + "loss": 0.0047, + "reward": -0.5815, + "step": 249 + }, + { + "epoch": 0.04, + "learning_rate": 9.478611531632702e-06, + "loss": 0.0048, + "reward": -0.35, + "step": 259 + }, + { + "epoch": 0.04, + "learning_rate": 9.438358104330215e-06, + "loss": 0.0054, + "reward": -0.4544, + "step": 269 + }, + { + "epoch": 0.04, + "learning_rate": 9.396700152804386e-06, + "loss": 0.0039, + "reward": -0.3515, + "step": 279 + }, + { + "epoch": 0.04, + "learning_rate": 9.353650859768423e-06, + "loss": 0.0052, + "reward": -0.3799, + "step": 289 + }, + { + "epoch": 0.04, + "learning_rate": 9.309223848227377e-06, + "loss": 0.0048, + "reward": -0.5378, + "step": 299 + }, + { + "epoch": 0.04, + "learning_rate": 9.26343317716712e-06, + "loss": 0.0057, + "reward": -0.4758, + "step": 309 + }, + { + "epoch": 0.05, + "learning_rate": 9.216293337105358e-06, + "loss": 0.0044, + "reward": -0.5203, + "step": 319 + }, + { + "epoch": 0.05, + "learning_rate": 9.167819245506095e-06, + "loss": 0.0054, + "reward": -0.5237, + "step": 329 + }, + { + "epoch": 0.05, + "learning_rate": 9.118026242058976e-06, + "loss": 0.0058, + "reward": -0.2535, + "step": 339 + }, + { + "epoch": 0.05, + "learning_rate": 9.066930083825025e-06, + "loss": 0.0067, + "reward": -0.5059, + "step": 349 + }, + { + "epoch": 0.05, + "learning_rate": 9.014546940250301e-06, + "loss": 0.0059, + "reward": -0.5255, + "step": 359 + }, + { + "epoch": 0.05, + "learning_rate": 8.960893388049056e-06, + "loss": 0.0047, + "reward": -0.3411, + "step": 369 + }, + { + "epoch": 0.05, + "learning_rate": 8.905986405958015e-06, + "loss": 0.0048, + "reward": -0.3859, + "step": 379 + }, + { + "epoch": 0.06, + "learning_rate": 8.849843369363425e-06, + "loss": 0.0058, + "reward": -0.3785, + "step": 389 + }, + { + "epoch": 0.06, + "learning_rate": 8.792482044802602e-06, + "loss": 0.0047, + "reward": -0.3432, + "step": 399 + }, + { + "epoch": 0.06, + "learning_rate": 8.733920584341673e-06, + "loss": 0.0057, + "reward": -0.3958, + "step": 409 + }, + { + "epoch": 0.06, + "learning_rate": 8.674177519831351e-06, + "loss": 0.0049, + "reward": -0.4713, + "step": 419 + }, + { + "epoch": 0.06, + "learning_rate": 8.613271757042483e-06, + "loss": 0.0048, + "reward": -0.4485, + "step": 429 + }, + { + "epoch": 0.06, + "learning_rate": 8.551222569683315e-06, + "loss": 0.0054, + "reward": -0.5861, + "step": 439 + }, + { + "epoch": 0.06, + "learning_rate": 8.488049593300287e-06, + "loss": 0.0052, + "reward": -0.292, + "step": 449 + }, + { + "epoch": 0.06, + "learning_rate": 8.423772819064349e-06, + "loss": 0.0049, + "reward": -0.4702, + "step": 459 + }, + { + "epoch": 0.07, + "learning_rate": 8.358412587444719e-06, + "loss": 0.0053, + "reward": -0.5542, + "step": 469 + }, + { + "epoch": 0.07, + "learning_rate": 8.291989581772126e-06, + "loss": 0.0048, + "reward": -0.4116, + "step": 479 + }, + { + "epoch": 0.07, + "learning_rate": 8.224524821693534e-06, + "loss": 0.005, + "reward": -0.3746, + "step": 489 + }, + { + "epoch": 0.07, + "learning_rate": 8.156039656520448e-06, + "loss": 0.0046, + "reward": -0.4481, + "step": 499 + }, + { + "epoch": 0.07, + "learning_rate": 8.086555758472905e-06, + "loss": 0.0043, + "reward": -0.4127, + "step": 509 + }, + { + "epoch": 0.07, + "learning_rate": 8.016095115821258e-06, + "loss": 0.0069, + "reward": -0.5597, + "step": 519 + }, + { + "epoch": 0.07, + "learning_rate": 7.944680025927976e-06, + "loss": 0.0061, + "reward": -0.4318, + "step": 529 + }, + { + "epoch": 0.08, + "learning_rate": 7.872333088191598e-06, + "loss": 0.0045, + "reward": -0.3063, + "step": 539 + }, + { + "epoch": 0.08, + "learning_rate": 7.799077196895131e-06, + "loss": 0.0048, + "reward": -0.3184, + "step": 549 + }, + { + "epoch": 0.08, + "learning_rate": 7.724935533961129e-06, + "loss": 0.0058, + "reward": -0.476, + "step": 559 + }, + { + "epoch": 0.08, + "learning_rate": 7.649931561615733e-06, + "loss": 0.0051, + "reward": -0.3959, + "step": 569 + }, + { + "epoch": 0.08, + "learning_rate": 7.574089014964029e-06, + "loss": 0.0051, + "reward": -0.4472, + "step": 579 + }, + { + "epoch": 0.08, + "learning_rate": 7.497431894479034e-06, + "loss": 0.0058, + "reward": -0.3736, + "step": 589 + }, + { + "epoch": 0.08, + "learning_rate": 7.419984458406722e-06, + "loss": 0.0043, + "reward": -0.4911, + "step": 599 + }, + { + "epoch": 0.09, + "learning_rate": 7.341771215089468e-06, + "loss": 0.005, + "reward": -0.3037, + "step": 609 + }, + { + "epoch": 0.09, + "learning_rate": 7.26281691521035e-06, + "loss": 0.0062, + "reward": -0.4219, + "step": 619 + }, + { + "epoch": 0.09, + "learning_rate": 7.183146543960761e-06, + "loss": 0.0051, + "reward": -0.3435, + "step": 629 + }, + { + "epoch": 0.09, + "learning_rate": 7.102785313133821e-06, + "loss": 0.0038, + "reward": -0.3745, + "step": 639 + }, + { + "epoch": 0.09, + "learning_rate": 7.021758653146058e-06, + "loss": 0.0053, + "reward": -0.3743, + "step": 649 + }, + { + "epoch": 0.09, + "learning_rate": 6.940092204989934e-06, + "loss": 0.006, + "reward": -0.4696, + "step": 659 + }, + { + "epoch": 0.09, + "learning_rate": 6.8578118121197144e-06, + "loss": 0.0058, + "reward": -0.4343, + "step": 669 + }, + { + "epoch": 0.1, + "learning_rate": 6.774943512273267e-06, + "loss": 0.0044, + "reward": -0.2842, + "step": 679 + }, + { + "epoch": 0.1, + "learning_rate": 6.691513529232391e-06, + "loss": 0.0046, + "reward": -0.345, + "step": 689 + }, + { + "epoch": 0.1, + "learning_rate": 6.607548264524268e-06, + "loss": 0.0047, + "reward": -0.3973, + "step": 699 + }, + { + "epoch": 0.1, + "learning_rate": 6.523074289066666e-06, + "loss": 0.0039, + "reward": -0.3412, + "step": 709 + }, + { + "epoch": 0.1, + "learning_rate": 6.43811833475953e-06, + "loss": 0.0054, + "reward": -0.3593, + "step": 719 + }, + { + "epoch": 0.1, + "learning_rate": 6.352707286025644e-06, + "loss": 0.0049, + "reward": -0.3673, + "step": 729 + }, + { + "epoch": 0.1, + "learning_rate": 6.266868171303017e-06, + "loss": 0.0046, + "reward": -0.4224, + "step": 739 + }, + { + "epoch": 0.11, + "learning_rate": 6.1806281544917e-06, + "loss": 0.0045, + "reward": -0.1521, + "step": 749 + }, + { + "epoch": 0.11, + "learning_rate": 6.094014526357734e-06, + "loss": 0.0056, + "reward": -0.3997, + "step": 759 + }, + { + "epoch": 0.11, + "learning_rate": 6.007054695896955e-06, + "loss": 0.0046, + "reward": -0.289, + "step": 769 + }, + { + "epoch": 0.11, + "learning_rate": 5.9197761816613705e-06, + "loss": 0.0042, + "reward": -0.3431, + "step": 779 + }, + { + "epoch": 0.11, + "learning_rate": 5.8322066030508924e-06, + "loss": 0.0049, + "reward": -0.3222, + "step": 789 + }, + { + "epoch": 0.11, + "learning_rate": 5.74437367157313e-06, + "loss": 0.0055, + "reward": -0.4949, + "step": 799 + }, + { + "epoch": 0.11, + "learning_rate": 5.656305182074053e-06, + "loss": 0.0065, + "reward": -0.4194, + "step": 809 + }, + { + "epoch": 0.12, + "learning_rate": 5.568029003942271e-06, + "loss": 0.005, + "reward": -0.5284, + "step": 819 + }, + { + "epoch": 0.12, + "learning_rate": 5.4795730722897435e-06, + "loss": 0.0058, + "reward": -0.5156, + "step": 829 + }, + { + "epoch": 0.12, + "learning_rate": 5.390965379111655e-06, + "loss": 0.0043, + "reward": -0.3164, + "step": 839 + }, + { + "epoch": 0.12, + "learning_rate": 5.302233964428329e-06, + "loss": 0.004, + "reward": -0.1936, + "step": 849 + }, + { + "epoch": 0.12, + "learning_rate": 5.213406907411921e-06, + "loss": 0.0039, + "reward": -0.2792, + "step": 859 + }, + { + "epoch": 0.12, + "learning_rate": 5.124512317500723e-06, + "loss": 0.005, + "reward": -0.2348, + "step": 869 + }, + { + "epoch": 0.12, + "learning_rate": 5.035578325503908e-06, + "loss": 0.0042, + "reward": -0.3528, + "step": 879 + }, + { + "epoch": 0.13, + "learning_rate": 4.946633074699485e-06, + "loss": 0.005, + "reward": -0.3753, + "step": 889 + }, + { + "epoch": 0.13, + "learning_rate": 4.857704711928325e-06, + "loss": 0.0052, + "reward": -0.4383, + "step": 899 + }, + { + "epoch": 0.13, + "learning_rate": 4.768821378687066e-06, + "loss": 0.0045, + "reward": -0.3664, + "step": 909 + }, + { + "epoch": 0.13, + "learning_rate": 4.6800112022226865e-06, + "loss": 0.0043, + "reward": -0.3584, + "step": 919 + }, + { + "epoch": 0.13, + "learning_rate": 4.591302286631612e-06, + "loss": 0.0048, + "reward": -0.455, + "step": 929 + }, + { + "epoch": 0.13, + "learning_rate": 4.502722703966126e-06, + "loss": 0.004, + "reward": -0.3906, + "step": 939 + }, + { + "epoch": 0.13, + "learning_rate": 4.414300485350945e-06, + "loss": 0.0046, + "reward": -0.4897, + "step": 949 + }, + { + "epoch": 0.14, + "learning_rate": 4.326063612112721e-06, + "loss": 0.0042, + "reward": -0.384, + "step": 959 + }, + { + "epoch": 0.14, + "learning_rate": 4.2380400069253255e-06, + "loss": 0.0039, + "reward": -0.4159, + "step": 969 + }, + { + "epoch": 0.14, + "learning_rate": 4.15025752497367e-06, + "loss": 0.0048, + "reward": -0.4036, + "step": 979 + }, + { + "epoch": 0.14, + "learning_rate": 4.062743945138906e-06, + "loss": 0.0042, + "reward": -0.4189, + "step": 989 + }, + { + "epoch": 0.14, + "learning_rate": 3.975526961207759e-06, + "loss": 0.005, + "reward": -0.2446, + "step": 999 + }, + { + "epoch": 0.14, + "learning_rate": 3.88863417310879e-06, + "loss": 0.0047, + "reward": -0.3705, + "step": 1009 + }, + { + "epoch": 0.14, + "learning_rate": 3.8020930781783704e-06, + "loss": 0.0048, + "reward": -0.3862, + "step": 1019 + }, + { + "epoch": 0.15, + "learning_rate": 3.7159310624591055e-06, + "loss": 0.0041, + "reward": -0.4077, + "step": 1029 + }, + { + "epoch": 0.15, + "learning_rate": 3.630175392033488e-06, + "loss": 0.0072, + "reward": -0.2784, + "step": 1039 + }, + { + "epoch": 0.15, + "learning_rate": 3.544853204395513e-06, + "loss": 0.0058, + "reward": -0.436, + "step": 1049 + }, + { + "epoch": 0.15, + "learning_rate": 3.45999149986298e-06, + "loss": 0.0045, + "reward": -0.3979, + "step": 1059 + }, + { + "epoch": 0.15, + "learning_rate": 3.375617133033209e-06, + "loss": 0.0055, + "reward": -0.4709, + "step": 1069 + }, + { + "epoch": 0.15, + "learning_rate": 3.2917568042848648e-06, + "loss": 0.0036, + "reward": -0.3748, + "step": 1079 + }, + { + "epoch": 0.15, + "learning_rate": 3.2167439478854534e-06, + "loss": 0.0057, + "reward": -0.586, + "step": 1089 + }, + { + "epoch": 0.16, + "learning_rate": 3.1339332616713215e-06, + "loss": 0.0047, + "reward": -0.2301, + "step": 1099 + }, + { + "epoch": 0.16, + "learning_rate": 3.051713094715606e-06, + "loss": 0.0052, + "reward": -0.4129, + "step": 1109 + }, + { + "epoch": 0.16, + "learning_rate": 2.9701094656976084e-06, + "loss": 0.0044, + "reward": -0.2389, + "step": 1119 + }, + { + "epoch": 0.16, + "learning_rate": 2.8891481981923897e-06, + "loss": 0.0039, + "reward": -0.3641, + "step": 1129 + }, + { + "epoch": 0.16, + "learning_rate": 2.8088549124988785e-06, + "loss": 0.0052, + "reward": -0.3099, + "step": 1139 + }, + { + "epoch": 0.16, + "learning_rate": 2.729255017532277e-06, + "loss": 0.0037, + "reward": -0.3203, + "step": 1149 + }, + { + "epoch": 0.16, + "learning_rate": 2.6503737027833926e-06, + "loss": 0.0052, + "reward": -0.4073, + "step": 1159 + }, + { + "epoch": 0.17, + "learning_rate": 2.5722359303473778e-06, + "loss": 0.0052, + "reward": -0.3275, + "step": 1169 + }, + { + "epoch": 0.17, + "learning_rate": 2.494866427024452e-06, + "loss": 0.004, + "reward": -0.3811, + "step": 1179 + }, + { + "epoch": 0.17, + "learning_rate": 2.4182896764950726e-06, + "loss": 0.0052, + "reward": -0.3413, + "step": 1189 + }, + { + "epoch": 0.17, + "learning_rate": 2.3425299115720295e-06, + "loss": 0.0052, + "reward": -0.5202, + "step": 1199 + }, + { + "epoch": 0.17, + "learning_rate": 2.267611106531961e-06, + "loss": 0.0048, + "reward": -0.3018, + "step": 1209 + }, + { + "epoch": 0.17, + "learning_rate": 2.193556969528642e-06, + "loss": 0.0056, + "reward": -0.4154, + "step": 1219 + }, + { + "epoch": 0.17, + "learning_rate": 2.1203909350905215e-06, + "loss": 0.0046, + "reward": -0.3844, + "step": 1229 + }, + { + "epoch": 0.18, + "learning_rate": 2.048136156704833e-06, + "loss": 0.0052, + "reward": -0.3442, + "step": 1239 + }, + { + "epoch": 0.18, + "learning_rate": 1.9768154994906352e-06, + "loss": 0.0053, + "reward": -0.357, + "step": 1249 + }, + { + "epoch": 0.18, + "learning_rate": 1.9064515329631267e-06, + "loss": 0.0043, + "reward": -0.2778, + "step": 1259 + }, + { + "epoch": 0.18, + "learning_rate": 1.837066523891483e-06, + "loss": 0.0066, + "reward": -0.3448, + "step": 1269 + }, + { + "epoch": 0.18, + "learning_rate": 1.768682429252519e-06, + "loss": 0.0051, + "reward": -0.3787, + "step": 1279 + }, + { + "epoch": 0.18, + "learning_rate": 1.7013208892823618e-06, + "loss": 0.004, + "reward": -0.4296, + "step": 1289 + }, + { + "epoch": 0.18, + "learning_rate": 1.6350032206283833e-06, + "loss": 0.0047, + "reward": -0.5144, + "step": 1299 + }, + { + "epoch": 0.19, + "learning_rate": 1.5697504096035116e-06, + "loss": 0.0052, + "reward": -0.331, + "step": 1309 + }, + { + "epoch": 0.19, + "learning_rate": 1.5055831055450825e-06, + "loss": 0.0039, + "reward": -0.3365, + "step": 1319 + }, + { + "epoch": 0.19, + "learning_rate": 1.4425216142803395e-06, + "loss": 0.0047, + "reward": -0.3728, + "step": 1329 + }, + { + "epoch": 0.19, + "learning_rate": 1.3805858917006148e-06, + "loss": 0.0048, + "reward": -0.3547, + "step": 1339 + }, + { + "epoch": 0.19, + "learning_rate": 1.3197955374462767e-06, + "loss": 0.0043, + "reward": -0.3398, + "step": 1349 + }, + { + "epoch": 0.19, + "learning_rate": 1.260169788704383e-06, + "loss": 0.0056, + "reward": -0.2891, + "step": 1359 + }, + { + "epoch": 0.19, + "learning_rate": 1.2017275141210604e-06, + "loss": 0.0042, + "reward": -0.3165, + "step": 1369 + }, + { + "epoch": 0.2, + "learning_rate": 1.1444872078304865e-06, + "loss": 0.0039, + "reward": -0.366, + "step": 1379 + }, + { + "epoch": 0.2, + "learning_rate": 1.0884669836024058e-06, + "loss": 0.004, + "reward": -0.2873, + "step": 1389 + }, + { + "epoch": 0.2, + "learning_rate": 1.033684569109994e-06, + "loss": 0.0046, + "reward": -0.2922, + "step": 1399 + }, + { + "epoch": 0.2, + "learning_rate": 9.80157300319926e-07, + "loss": 0.0037, + "reward": -0.3076, + "step": 1409 + }, + { + "epoch": 0.2, + "learning_rate": 9.279021160063712e-07, + "loss": 0.0066, + "reward": -0.5213, + "step": 1419 + }, + { + "epoch": 0.2, + "learning_rate": 8.769355523907086e-07, + "loss": 0.0044, + "reward": -0.5063, + "step": 1429 + }, + { + "epoch": 0.2, + "learning_rate": 8.272737379086088e-07, + "loss": 0.0041, + "reward": -0.5909, + "step": 1439 + }, + { + "epoch": 0.21, + "learning_rate": 7.789323881061777e-07, + "loss": 0.0044, + "reward": -0.2486, + "step": 1449 + }, + { + "epoch": 0.21, + "learning_rate": 7.31926800666744e-07, + "loss": 0.0044, + "reward": -0.4971, + "step": 1459 + }, + { + "epoch": 0.21, + "learning_rate": 6.862718505698945e-07, + "loss": 0.0043, + "reward": -0.5182, + "step": 1469 + }, + { + "epoch": 0.21, + "learning_rate": 6.419819853842591e-07, + "loss": 0.0046, + "reward": -0.2389, + "step": 1479 + }, + { + "epoch": 0.21, + "learning_rate": 5.990712206955674e-07, + "loss": 0.0039, + "reward": -0.3725, + "step": 1489 + }, + { + "epoch": 0.21, + "learning_rate": 5.575531356713904e-07, + "loss": 0.0046, + "reward": -0.4709, + "step": 1499 + }, + { + "epoch": 0.21, + "learning_rate": 5.17440868764002e-07, + "loss": 0.005, + "reward": -0.3545, + "step": 1509 + }, + { + "epoch": 0.22, + "learning_rate": 4.787471135526945e-07, + "loss": 0.0041, + "reward": -0.2898, + "step": 1519 + }, + { + "epoch": 0.22, + "learning_rate": 4.414841147268811e-07, + "loss": 0.0045, + "reward": -0.4093, + "step": 1529 + }, + { + "epoch": 0.22, + "learning_rate": 4.056636642112427e-07, + "loss": 0.004, + "reward": -0.3965, + "step": 1539 + }, + { + "epoch": 0.22, + "learning_rate": 3.7129709743416733e-07, + "loss": 0.0045, + "reward": -0.3877, + "step": 1549 + }, + { + "epoch": 0.22, + "learning_rate": 3.3839528974062843e-07, + "loss": 0.0046, + "reward": -0.3655, + "step": 1559 + }, + { + "epoch": 0.22, + "learning_rate": 3.069686529506777e-07, + "loss": 0.0045, + "reward": -0.5236, + "step": 1569 + }, + { + "epoch": 0.22, + "learning_rate": 2.770271320646023e-07, + "loss": 0.0053, + "reward": -0.441, + "step": 1579 + }, + { + "epoch": 0.22, + "learning_rate": 2.4858020211582346e-07, + "loss": 0.004, + "reward": -0.2618, + "step": 1589 + }, + { + "epoch": 0.23, + "learning_rate": 2.2163686517250427e-07, + "loss": 0.004, + "reward": -0.4623, + "step": 1599 + }, + { + "epoch": 0.23, + "learning_rate": 1.962056474888391e-07, + "loss": 0.0038, + "reward": -0.2542, + "step": 1609 + }, + { + "epoch": 0.23, + "learning_rate": 1.7229459680690176e-07, + "loss": 0.0051, + "reward": -0.377, + "step": 1619 + }, + { + "epoch": 0.23, + "learning_rate": 1.4991127980993503e-07, + "loss": 0.0046, + "reward": -0.3763, + "step": 1629 + }, + { + "epoch": 0.23, + "learning_rate": 1.290627797278593e-07, + "loss": 0.0046, + "reward": -0.4469, + "step": 1639 + }, + { + "epoch": 0.23, + "learning_rate": 1.0975569409577668e-07, + "loss": 0.0054, + "reward": -0.4301, + "step": 1649 + }, + { + "epoch": 0.23, + "learning_rate": 9.199613266616891e-08, + "loss": 0.0047, + "reward": -0.481, + "step": 1659 + }, + { + "epoch": 0.24, + "learning_rate": 7.578971547546554e-08, + "loss": 0.0047, + "reward": -0.549, + "step": 1669 + }, + { + "epoch": 0.24, + "learning_rate": 6.114157106556773e-08, + "loss": 0.0058, + "reward": -0.3571, + "step": 1679 + }, + { + "epoch": 0.24, + "learning_rate": 4.8056334860921426e-08, + "loss": 0.005, + "reward": -0.3539, + "step": 1689 + }, + { + "epoch": 0.24, + "learning_rate": 3.653814770162578e-08, + "loss": 0.0037, + "reward": -0.3161, + "step": 1699 + }, + { + "epoch": 0.24, + "learning_rate": 2.6590654533062975e-08, + "loss": 0.0053, + "reward": -0.4499, + "step": 1709 + }, + { + "epoch": 0.24, + "learning_rate": 1.821700325244813e-08, + "loss": 0.0047, + "reward": -0.3267, + "step": 1719 + }, + { + "epoch": 0.24, + "learning_rate": 1.141984371267335e-08, + "loss": 0.0043, + "reward": -0.4299, + "step": 1729 + }, + { + "epoch": 0.25, + "learning_rate": 6.2013268837601834e-09, + "loss": 0.0051, + "reward": -0.4119, + "step": 1739 + }, + { + "epoch": 0.25, + "learning_rate": 2.5631041721801976e-09, + "loss": 0.0048, + "reward": -0.492, + "step": 1749 + }, + { + "epoch": 0.25, + "learning_rate": 5.063268982646863e-10, + "loss": 0.0053, + "reward": -0.5111, + "step": 1759 + }, + { + "epoch": 0.25, + "learning_rate": 3.164593187165999e-11, + "loss": 0.0057, + "reward": -0.5665, + "step": 1769 + }, + { + "epoch": 0.25, + "learning_rate": 1.1392114864122727e-09, + "loss": 0.0039, + "reward": -0.3717, + "step": 1779 + }, + { + "epoch": 0.25, + "learning_rate": 3.828673071319955e-09, + "loss": 0.0049, + "reward": -0.4831, + "step": 1789 + }, + { + "epoch": 0.25, + "learning_rate": 8.099179602960583e-09, + "loss": 0.0052, + "reward": -0.4277, + "step": 1799 + }, + { + "epoch": 0.26, + "learning_rate": 1.3949379673960372e-08, + "loss": 0.0047, + "reward": -0.3236, + "step": 1809 + }, + { + "epoch": 0.26, + "learning_rate": 2.1377421980859903e-08, + "loss": 0.0044, + "reward": -0.4584, + "step": 1819 + }, + { + "epoch": 0.26, + "learning_rate": 3.0380955909962706e-08, + "loss": 0.004, + "reward": -0.427, + "step": 1829 + }, + { + "epoch": 0.26, + "learning_rate": 4.095713228118803e-08, + "loss": 0.0046, + "reward": -0.4793, + "step": 1839 + }, + { + "epoch": 0.26, + "learning_rate": 5.310260424970071e-08, + "loss": 0.005, + "reward": -0.3642, + "step": 1849 + }, + { + "epoch": 0.26, + "learning_rate": 6.681352836502009e-08, + "loss": 0.0036, + "reward": -0.3235, + "step": 1859 + }, + { + "epoch": 0.26, + "learning_rate": 8.208556578728933e-08, + "loss": 0.0055, + "reward": -0.4695, + "step": 1869 + }, + { + "epoch": 0.27, + "learning_rate": 9.891388366030486e-08, + "loss": 0.005, + "reward": -0.3998, + "step": 1879 + }, + { + "epoch": 0.27, + "learning_rate": 1.172931566408797e-07, + "loss": 0.0046, + "reward": -0.3878, + "step": 1889 + }, + { + "epoch": 0.27, + "learning_rate": 1.3721756858405545e-07, + "loss": 0.0055, + "reward": -0.5067, + "step": 1899 + }, + { + "epoch": 0.27, + "learning_rate": 1.5868081438363213e-07, + "loss": 0.0038, + "reward": -0.3747, + "step": 1909 + }, + { + "epoch": 0.27, + "learning_rate": 1.8167610196742125e-07, + "loss": 0.0052, + "reward": -0.2461, + "step": 1919 + }, + { + "epoch": 0.27, + "learning_rate": 2.0619615444661012e-07, + "loss": 0.0044, + "reward": -0.2565, + "step": 1929 + }, + { + "epoch": 0.27, + "learning_rate": 2.3223321241854335e-07, + "loss": 0.0045, + "reward": -0.4397, + "step": 1939 + }, + { + "epoch": 0.28, + "learning_rate": 2.5977903642219305e-07, + "loss": 0.0047, + "reward": -0.2828, + "step": 1949 + }, + { + "epoch": 0.28, + "learning_rate": 2.8882490954554976e-07, + "loss": 0.0049, + "reward": -0.361, + "step": 1959 + }, + { + "epoch": 0.28, + "learning_rate": 3.193616401840971e-07, + "loss": 0.0054, + "reward": -0.2941, + "step": 1969 + }, + { + "epoch": 0.28, + "learning_rate": 3.513795649495133e-07, + "loss": 0.0046, + "reward": -0.3027, + "step": 1979 + }, + { + "epoch": 0.28, + "learning_rate": 3.848685517276546e-07, + "loss": 0.0037, + "reward": -0.391, + "step": 1989 + }, + { + "epoch": 0.28, + "learning_rate": 4.1981800288488416e-07, + "loss": 0.0048, + "reward": -0.3608, + "step": 1999 + }, + { + "epoch": 0.28, + "learning_rate": 4.562168586217008e-07, + "loss": 0.0044, + "reward": -0.3958, + "step": 2009 + }, + { + "epoch": 0.29, + "learning_rate": 4.940536004726337e-07, + "loss": 0.0072, + "reward": -0.5123, + "step": 2019 + }, + { + "epoch": 0.29, + "learning_rate": 5.33316254951266e-07, + "loss": 0.0044, + "reward": -0.2958, + "step": 2029 + }, + { + "epoch": 0.29, + "learning_rate": 5.739923973392685e-07, + "loss": 0.0047, + "reward": -0.4311, + "step": 2039 + }, + { + "epoch": 0.29, + "learning_rate": 6.160691556182191e-07, + "loss": 0.0039, + "reward": -0.4388, + "step": 2049 + }, + { + "epoch": 0.29, + "learning_rate": 6.595332145429611e-07, + "loss": 0.0066, + "reward": -0.4963, + "step": 2059 + }, + { + "epoch": 0.29, + "learning_rate": 7.043708198552385e-07, + "loss": 0.0051, + "reward": -0.3088, + "step": 2069 + }, + { + "epoch": 0.29, + "learning_rate": 7.505677826362434e-07, + "loss": 0.0054, + "reward": -0.3397, + "step": 2079 + }, + { + "epoch": 0.3, + "learning_rate": 7.981094837967229e-07, + "loss": 0.0044, + "reward": -0.4052, + "step": 2089 + }, + { + "epoch": 0.3, + "learning_rate": 8.46980878703203e-07, + "loss": 0.0049, + "reward": -0.3994, + "step": 2099 + }, + { + "epoch": 0.3, + "learning_rate": 8.971665019388887e-07, + "loss": 0.0051, + "reward": -0.4254, + "step": 2109 + }, + { + "epoch": 0.3, + "learning_rate": 9.486504721977097e-07, + "loss": 0.0043, + "reward": -0.3374, + "step": 2119 + }, + { + "epoch": 0.3, + "learning_rate": 1.0014164973099866e-06, + "loss": 0.0058, + "reward": -0.3854, + "step": 2129 + }, + { + "epoch": 0.3, + "learning_rate": 1.0554478793981015e-06, + "loss": 0.0043, + "reward": -0.3606, + "step": 2139 + }, + { + "epoch": 0.3, + "learning_rate": 1.1107275201605728e-06, + "loss": 0.0041, + "reward": -0.3453, + "step": 2149 + }, + { + "epoch": 0.31, + "learning_rate": 1.1672379262828238e-06, + "loss": 0.008, + "reward": -0.3853, + "step": 2159 + }, + { + "epoch": 0.31, + "learning_rate": 1.2249612149729779e-06, + "loss": 0.0052, + "reward": -0.3406, + "step": 2169 + }, + { + "epoch": 0.31, + "learning_rate": 1.2838791196208771e-06, + "loss": 0.0043, + "reward": -0.3696, + "step": 2179 + }, + { + "epoch": 0.31, + "learning_rate": 1.3439729955785901e-06, + "loss": 0.0048, + "reward": -0.326, + "step": 2189 + }, + { + "epoch": 0.31, + "learning_rate": 1.40522382606052e-06, + "loss": 0.0048, + "reward": -0.3875, + "step": 2199 + }, + { + "epoch": 0.31, + "learning_rate": 1.4676122281613041e-06, + "loss": 0.0044, + "reward": -0.3224, + "step": 2209 + }, + { + "epoch": 0.31, + "learning_rate": 1.5311184589895495e-06, + "loss": 0.0054, + "reward": -0.4125, + "step": 2219 + }, + { + "epoch": 0.32, + "learning_rate": 1.595722421915507e-06, + "loss": 0.0051, + "reward": -0.5115, + "step": 2229 + }, + { + "epoch": 0.32, + "learning_rate": 1.6614036729306638e-06, + "loss": 0.0042, + "reward": -0.5107, + "step": 2239 + }, + { + "epoch": 0.32, + "learning_rate": 1.7281414271172925e-06, + "loss": 0.0048, + "reward": -0.4813, + "step": 2249 + }, + { + "epoch": 0.32, + "learning_rate": 1.7959145652258408e-06, + "loss": 0.0036, + "reward": -0.2592, + "step": 2259 + }, + { + "epoch": 0.32, + "learning_rate": 1.8647016403581763e-06, + "loss": 0.0045, + "reward": -0.431, + "step": 2269 + }, + { + "epoch": 0.32, + "learning_rate": 1.9344808847544632e-06, + "loss": 0.0045, + "reward": -0.3041, + "step": 2279 + }, + { + "epoch": 0.32, + "learning_rate": 2.0052302166816017e-06, + "loss": 0.0054, + "reward": -0.2746, + "step": 2289 + }, + { + "epoch": 0.33, + "learning_rate": 2.0769272474210374e-06, + "loss": 0.0059, + "reward": -0.5107, + "step": 2299 + }, + { + "epoch": 0.33, + "learning_rate": 2.149549288353676e-06, + "loss": 0.0044, + "reward": -0.3638, + "step": 2309 + }, + { + "epoch": 0.33, + "learning_rate": 2.2230733581397427e-06, + "loss": 0.0055, + "reward": -0.3426, + "step": 2319 + }, + { + "epoch": 0.33, + "learning_rate": 2.297476189991249e-06, + "loss": 0.0048, + "reward": -0.3561, + "step": 2329 + }, + { + "epoch": 0.33, + "learning_rate": 2.3727342390348134e-06, + "loss": 0.0058, + "reward": -0.334, + "step": 2339 + }, + { + "epoch": 0.33, + "learning_rate": 2.4488236897624457e-06, + "loss": 0.0043, + "reward": -0.188, + "step": 2349 + }, + { + "epoch": 0.33, + "learning_rate": 2.525720463568009e-06, + "loss": 0.005, + "reward": -0.3464, + "step": 2359 + }, + { + "epoch": 0.34, + "learning_rate": 2.603400226366919e-06, + "loss": 0.0041, + "reward": -0.4215, + "step": 2369 + }, + { + "epoch": 0.34, + "learning_rate": 2.6818383962967134e-06, + "loss": 0.0059, + "reward": -0.483, + "step": 2379 + }, + { + "epoch": 0.34, + "learning_rate": 2.7610101514959903e-06, + "loss": 0.0042, + "reward": -0.3055, + "step": 2389 + }, + { + "epoch": 0.34, + "learning_rate": 2.840890437959334e-06, + "loss": 0.0047, + "reward": -0.2254, + "step": 2399 + }, + { + "epoch": 0.34, + "learning_rate": 2.92145397746568e-06, + "loss": 0.0049, + "reward": -0.4363, + "step": 2409 + }, + { + "epoch": 0.34, + "learning_rate": 3.002675275577659e-06, + "loss": 0.0053, + "reward": -0.4156, + "step": 2419 + }, + { + "epoch": 0.34, + "learning_rate": 3.0845286297093167e-06, + "loss": 0.0032, + "reward": -0.3561, + "step": 2429 + }, + { + "epoch": 0.35, + "learning_rate": 3.166988137259751e-06, + "loss": 0.0039, + "reward": -0.4369, + "step": 2439 + }, + { + "epoch": 0.35, + "learning_rate": 3.2500277038100126e-06, + "loss": 0.0049, + "reward": -0.431, + "step": 2449 + }, + { + "epoch": 0.35, + "learning_rate": 3.3336210513807366e-06, + "loss": 0.0047, + "reward": -0.4215, + "step": 2459 + }, + { + "epoch": 0.35, + "learning_rate": 3.4177417267478236e-06, + "loss": 0.0044, + "reward": -0.2004, + "step": 2469 + }, + { + "epoch": 0.35, + "learning_rate": 3.502363109813589e-06, + "loss": 0.0039, + "reward": -0.3595, + "step": 2479 + }, + { + "epoch": 0.35, + "learning_rate": 3.5874584220307686e-06, + "loss": 0.0052, + "reward": -0.3384, + "step": 2489 + }, + { + "epoch": 0.35, + "learning_rate": 3.673000734876582e-06, + "loss": 0.0042, + "reward": -0.1973, + "step": 2499 + }, + { + "epoch": 0.36, + "learning_rate": 3.7589629783743188e-06, + "loss": 0.0044, + "reward": -0.4077, + "step": 2509 + }, + { + "epoch": 0.36, + "learning_rate": 3.845317949659662e-06, + "loss": 0.0046, + "reward": -0.5238, + "step": 2519 + }, + { + "epoch": 0.36, + "learning_rate": 3.932038321589086e-06, + "loss": 0.0039, + "reward": -0.3569, + "step": 2529 + }, + { + "epoch": 0.36, + "learning_rate": 4.01909665138754e-06, + "loss": 0.005, + "reward": -0.4477, + "step": 2539 + }, + { + "epoch": 0.36, + "learning_rate": 4.106465389332768e-06, + "loss": 0.0035, + "reward": -0.303, + "step": 2549 + }, + { + "epoch": 0.36, + "learning_rate": 4.194116887473445e-06, + "loss": 0.0042, + "reward": -0.3804, + "step": 2559 + }, + { + "epoch": 0.36, + "learning_rate": 4.282023408378429e-06, + "loss": 0.0047, + "reward": -0.4259, + "step": 2569 + }, + { + "epoch": 0.37, + "learning_rate": 4.370157133914274e-06, + "loss": 0.0049, + "reward": -0.3371, + "step": 2579 + }, + { + "epoch": 0.37, + "learning_rate": 4.458490174048339e-06, + "loss": 0.0047, + "reward": -0.4291, + "step": 2589 + }, + { + "epoch": 0.37, + "learning_rate": 4.5469945756746145e-06, + "loss": 0.0044, + "reward": -0.4106, + "step": 2599 + }, + { + "epoch": 0.37, + "learning_rate": 4.635642331459522e-06, + "loss": 0.0036, + "reward": -0.3657, + "step": 2609 + }, + { + "epoch": 0.37, + "learning_rate": 4.724405388704883e-06, + "loss": 0.0052, + "reward": -0.3857, + "step": 2619 + }, + { + "epoch": 0.37, + "learning_rate": 4.804367507873278e-06, + "loss": 0.0047, + "reward": -0.3853, + "step": 2629 + }, + { + "epoch": 0.37, + "learning_rate": 4.893272229193558e-06, + "loss": 0.0054, + "reward": -0.3366, + "step": 2639 + }, + { + "epoch": 0.38, + "learning_rate": 4.982210724656406e-06, + "loss": 0.005, + "reward": -0.4375, + "step": 2649 + }, + { + "epoch": 0.38, + "learning_rate": 5.071154849558693e-06, + "loss": 0.0043, + "reward": -0.3342, + "step": 2659 + }, + { + "epoch": 0.38, + "learning_rate": 5.160076457415833e-06, + "loss": 0.0047, + "reward": -0.4507, + "step": 2669 + }, + { + "epoch": 0.38, + "learning_rate": 5.248947408868792e-06, + "loss": 0.005, + "reward": -0.4391, + "step": 2679 + }, + { + "epoch": 0.38, + "learning_rate": 5.33773958058882e-06, + "loss": 0.0036, + "reward": -0.2586, + "step": 2689 + }, + { + "epoch": 0.38, + "learning_rate": 5.426424874177126e-06, + "loss": 0.0044, + "reward": -0.4199, + "step": 2699 + }, + { + "epoch": 0.38, + "learning_rate": 5.514975225056634e-06, + "loss": 0.0044, + "reward": -0.4119, + "step": 2709 + }, + { + "epoch": 0.38, + "learning_rate": 5.603362611353067e-06, + "loss": 0.0043, + "reward": -0.3747, + "step": 2719 + }, + { + "epoch": 0.39, + "learning_rate": 5.691559062762498e-06, + "loss": 0.0051, + "reward": -0.2529, + "step": 2729 + }, + { + "epoch": 0.39, + "learning_rate": 5.779536669402608e-06, + "loss": 0.0038, + "reward": -0.3863, + "step": 2739 + }, + { + "epoch": 0.39, + "learning_rate": 5.867267590644781e-06, + "loss": 0.0043, + "reward": -0.4039, + "step": 2749 + }, + { + "epoch": 0.39, + "learning_rate": 5.954724063924317e-06, + "loss": 0.0041, + "reward": -0.3328, + "step": 2759 + }, + { + "epoch": 0.39, + "learning_rate": 6.041878413525932e-06, + "loss": 0.0044, + "reward": -0.2204, + "step": 2769 + }, + { + "epoch": 0.39, + "learning_rate": 6.128703059341788e-06, + "loss": 0.0056, + "reward": -0.4904, + "step": 2779 + }, + { + "epoch": 0.39, + "learning_rate": 6.215170525599225e-06, + "loss": 0.0047, + "reward": -0.3944, + "step": 2789 + }, + { + "epoch": 0.4, + "learning_rate": 6.3012534495555275e-06, + "loss": 0.0053, + "reward": -0.5206, + "step": 2799 + }, + { + "epoch": 0.4, + "learning_rate": 6.386924590156891e-06, + "loss": 0.0033, + "reward": -0.1779, + "step": 2809 + }, + { + "epoch": 0.4, + "learning_rate": 6.4721568366589e-06, + "loss": 0.0045, + "reward": -0.4464, + "step": 2819 + }, + { + "epoch": 0.4, + "learning_rate": 6.556923217205744e-06, + "loss": 0.0036, + "reward": -0.3361, + "step": 2829 + }, + { + "epoch": 0.4, + "learning_rate": 6.641196907365499e-06, + "loss": 0.0049, + "reward": -0.5177, + "step": 2839 + }, + { + "epoch": 0.4, + "learning_rate": 6.724951238618763e-06, + "loss": 0.0048, + "reward": -0.4074, + "step": 2849 + }, + { + "epoch": 0.4, + "learning_rate": 6.808159706797949e-06, + "loss": 0.0047, + "reward": -0.2954, + "step": 2859 + }, + { + "epoch": 0.41, + "learning_rate": 6.8907959804745294e-06, + "loss": 0.0046, + "reward": -0.312, + "step": 2869 + }, + { + "epoch": 0.41, + "learning_rate": 6.972833909291694e-06, + "loss": 0.0053, + "reward": -0.4417, + "step": 2879 + }, + { + "epoch": 0.41, + "learning_rate": 7.054247532239634e-06, + "loss": 0.0036, + "reward": -0.2909, + "step": 2889 + }, + { + "epoch": 0.41, + "learning_rate": 7.135011085870964e-06, + "loss": 0.0044, + "reward": -0.2276, + "step": 2899 + }, + { + "epoch": 0.41, + "learning_rate": 7.21509901245357e-06, + "loss": 0.0049, + "reward": -0.3637, + "step": 2909 + }, + { + "epoch": 0.41, + "learning_rate": 7.294485968058404e-06, + "loss": 0.0067, + "reward": -0.3676, + "step": 2919 + }, + { + "epoch": 0.41, + "learning_rate": 7.373146830579596e-06, + "loss": 0.0034, + "reward": -0.1601, + "step": 2929 + }, + { + "epoch": 0.42, + "learning_rate": 7.451056707684396e-06, + "loss": 0.0041, + "reward": -0.1314, + "step": 2939 + }, + { + "epoch": 0.42, + "learning_rate": 7.528190944690356e-06, + "loss": 0.0035, + "reward": -0.2391, + "step": 2949 + }, + { + "epoch": 0.42, + "learning_rate": 7.6045251323673555e-06, + "loss": 0.0052, + "reward": -0.4042, + "step": 2959 + }, + { + "epoch": 0.42, + "learning_rate": 7.680035114661929e-06, + "loss": 0.0044, + "reward": -0.3035, + "step": 2969 + }, + { + "epoch": 0.42, + "learning_rate": 7.754696996341486e-06, + "loss": 0.0049, + "reward": -0.3552, + "step": 2979 + }, + { + "epoch": 0.42, + "learning_rate": 7.828487150555979e-06, + "loss": 0.0049, + "reward": -0.2459, + "step": 2989 + }, + { + "epoch": 0.42, + "learning_rate": 7.901382226314662e-06, + "loss": 0.0036, + "reward": -0.2989, + "step": 2999 + }, + { + "epoch": 0.43, + "learning_rate": 7.973359155875521e-06, + "loss": 0.0057, + "reward": -0.5494, + "step": 3009 + }, + { + "epoch": 0.43, + "learning_rate": 8.044395162045135e-06, + "loss": 0.0045, + "reward": -0.3344, + "step": 3019 + }, + { + "epoch": 0.43, + "learning_rate": 8.11446776538649e-06, + "loss": 0.0045, + "reward": -0.3949, + "step": 3029 + }, + { + "epoch": 0.43, + "learning_rate": 8.183554791332675e-06, + "loss": 0.004, + "reward": -0.2997, + "step": 3039 + }, + { + "epoch": 0.43, + "learning_rate": 8.251634377204023e-06, + "loss": 0.0034, + "reward": -0.2654, + "step": 3049 + }, + { + "epoch": 0.43, + "learning_rate": 8.318684979126607e-06, + "loss": 0.0034, + "reward": -0.4013, + "step": 3059 + }, + { + "epoch": 0.43, + "learning_rate": 8.384685378849804e-06, + "loss": 0.0035, + "reward": -0.4777, + "step": 3069 + }, + { + "epoch": 0.44, + "learning_rate": 8.44961469046086e-06, + "loss": 0.0031, + "reward": -0.3525, + "step": 3079 + }, + { + "epoch": 0.44, + "learning_rate": 8.513452366994242e-06, + "loss": 0.0042, + "reward": -0.1987, + "step": 3089 + }, + { + "epoch": 0.44, + "learning_rate": 8.576178206933773e-06, + "loss": 0.0043, + "reward": -0.439, + "step": 3099 + }, + { + "epoch": 0.44, + "learning_rate": 8.637772360605421e-06, + "loss": 0.0048, + "reward": -0.2539, + "step": 3109 + }, + { + "epoch": 0.44, + "learning_rate": 8.698215336458743e-06, + "loss": 0.0047, + "reward": -0.4092, + "step": 3119 + }, + { + "epoch": 0.44, + "learning_rate": 8.757488007235031e-06, + "loss": 0.0042, + "reward": -0.288, + "step": 3129 + }, + { + "epoch": 0.44, + "learning_rate": 8.815571616020147e-06, + "loss": 0.0033, + "reward": -0.2841, + "step": 3139 + }, + { + "epoch": 0.45, + "learning_rate": 8.872447782180168e-06, + "loss": 0.0044, + "reward": -0.3696, + "step": 3149 + }, + { + "epoch": 0.45, + "learning_rate": 8.92809850717797e-06, + "loss": 0.0034, + "reward": -0.1236, + "step": 3159 + }, + { + "epoch": 0.45, + "learning_rate": 8.982506180268895e-06, + "loss": 0.0041, + "reward": -0.269, + "step": 3169 + }, + { + "epoch": 0.45, + "learning_rate": 9.035653584073673e-06, + "loss": 0.0029, + "reward": -0.4326, + "step": 3179 + }, + { + "epoch": 0.45, + "learning_rate": 9.087523900026907e-06, + "loss": 0.0038, + "reward": -0.2885, + "step": 3189 + }, + { + "epoch": 0.45, + "learning_rate": 9.138100713699312e-06, + "loss": 0.0038, + "reward": -0.3119, + "step": 3199 + }, + { + "epoch": 0.45, + "learning_rate": 9.187368019992092e-06, + "loss": 0.004, + "reward": -0.196, + "step": 3209 + }, + { + "epoch": 0.46, + "learning_rate": 9.235310228201782e-06, + "loss": 0.0036, + "reward": -0.3683, + "step": 3219 + }, + { + "epoch": 0.46, + "learning_rate": 9.281912166953929e-06, + "loss": 0.0035, + "reward": -0.1997, + "step": 3229 + }, + { + "epoch": 0.46, + "learning_rate": 9.327159089004098e-06, + "loss": 0.0042, + "reward": -0.403, + "step": 3239 + }, + { + "epoch": 0.46, + "learning_rate": 9.371036675904667e-06, + "loss": 0.0034, + "reward": -0.3637, + "step": 3249 + }, + { + "epoch": 0.46, + "learning_rate": 9.413531042535915e-06, + "loss": 0.0049, + "reward": -0.3766, + "step": 3259 + }, + { + "epoch": 0.46, + "learning_rate": 9.454628741499976e-06, + "loss": 0.0044, + "reward": -0.3386, + "step": 3269 + }, + { + "epoch": 0.46, + "learning_rate": 9.494316767376295e-06, + "loss": 0.0039, + "reward": -0.3232, + "step": 3279 + }, + { + "epoch": 0.47, + "learning_rate": 9.532582560837204e-06, + "loss": 0.0032, + "reward": -0.3225, + "step": 3289 + }, + { + "epoch": 0.47, + "learning_rate": 9.569414012622356e-06, + "loss": 0.0037, + "reward": -0.3366, + "step": 3299 + }, + { + "epoch": 0.47, + "learning_rate": 9.604799467370689e-06, + "loss": 0.0038, + "reward": -0.3283, + "step": 3309 + }, + { + "epoch": 0.47, + "learning_rate": 9.63872772730879e-06, + "loss": 0.0033, + "reward": -0.2504, + "step": 3319 + }, + { + "epoch": 0.47, + "learning_rate": 9.671188055794462e-06, + "loss": 0.0037, + "reward": -0.3496, + "step": 3329 + }, + { + "epoch": 0.47, + "learning_rate": 9.702170180714328e-06, + "loss": 0.0035, + "reward": -0.3135, + "step": 3339 + }, + { + "epoch": 0.47, + "learning_rate": 9.731664297734458e-06, + "loss": 0.0036, + "reward": -0.3951, + "step": 3349 + }, + { + "epoch": 0.48, + "learning_rate": 9.75966107340297e-06, + "loss": 0.0032, + "reward": -0.4631, + "step": 3359 + }, + { + "epoch": 0.48, + "learning_rate": 9.786151648103613e-06, + "loss": 0.0036, + "reward": -0.3141, + "step": 3369 + }, + { + "epoch": 0.48, + "learning_rate": 9.811127638859398e-06, + "loss": 0.003, + "reward": -0.1992, + "step": 3379 + }, + { + "epoch": 0.48, + "learning_rate": 9.834581141985404e-06, + "loss": 0.0038, + "reward": -0.3201, + "step": 3389 + }, + { + "epoch": 0.48, + "learning_rate": 9.85650473558991e-06, + "loss": 0.0031, + "reward": -0.1577, + "step": 3399 + }, + { + "epoch": 0.48, + "learning_rate": 9.876891481923067e-06, + "loss": 0.0035, + "reward": -0.2635, + "step": 3409 + }, + { + "epoch": 0.48, + "learning_rate": 9.89573492957235e-06, + "loss": 0.0044, + "reward": -0.3539, + "step": 3419 + }, + { + "epoch": 0.49, + "learning_rate": 9.91302911550412e-06, + "loss": 0.0031, + "reward": -0.3358, + "step": 3429 + }, + { + "epoch": 0.49, + "learning_rate": 9.928768566950632e-06, + "loss": 0.0041, + "reward": -0.2885, + "step": 3439 + }, + { + "epoch": 0.49, + "learning_rate": 9.94294830314191e-06, + "loss": 0.0037, + "reward": -0.2699, + "step": 3449 + }, + { + "epoch": 0.49, + "learning_rate": 9.955563836881898e-06, + "loss": 0.0053, + "reward": -0.317, + "step": 3459 + }, + { + "epoch": 0.49, + "learning_rate": 9.966611175968454e-06, + "loss": 0.0035, + "reward": -0.2824, + "step": 3469 + }, + { + "epoch": 0.49, + "learning_rate": 9.976086824456686e-06, + "loss": 0.004, + "reward": -0.5046, + "step": 3479 + }, + { + "epoch": 0.49, + "learning_rate": 9.983987783765243e-06, + "loss": 0.0036, + "reward": -0.4293, + "step": 3489 + }, + { + "epoch": 0.5, + "learning_rate": 9.990311553625227e-06, + "loss": 0.0034, + "reward": -0.1845, + "step": 3499 + }, + { + "epoch": 0.5, + "learning_rate": 9.995056132871399e-06, + "loss": 0.0035, + "reward": -0.1239, + "step": 3509 + }, + { + "epoch": 0.5, + "learning_rate": 9.998220020075455e-06, + "loss": 0.0031, + "reward": -0.271, + "step": 3519 + }, + { + "epoch": 0.5, + "learning_rate": 9.999802214021156e-06, + "loss": 0.0039, + "reward": -0.4751, + "step": 3529 + }, + { + "epoch": 0.5, + "learning_rate": 9.999802214021156e-06, + "loss": 0.0038, + "reward": -0.454, + "step": 3539 + }, + { + "epoch": 0.5, + "learning_rate": 9.998220020075455e-06, + "loss": 0.0041, + "reward": -0.1722, + "step": 3549 + }, + { + "epoch": 0.5, + "learning_rate": 9.9950561328714e-06, + "loss": 0.0041, + "reward": -0.2842, + "step": 3559 + }, + { + "epoch": 0.51, + "learning_rate": 9.990311553625229e-06, + "loss": 0.0042, + "reward": -0.3914, + "step": 3569 + }, + { + "epoch": 0.51, + "learning_rate": 9.983987783765245e-06, + "loss": 0.0038, + "reward": -0.1993, + "step": 3579 + }, + { + "epoch": 0.51, + "learning_rate": 9.976086824456686e-06, + "loss": 0.0029, + "reward": -0.3465, + "step": 3589 + }, + { + "epoch": 0.51, + "learning_rate": 9.966611175968454e-06, + "loss": 0.0034, + "reward": -0.209, + "step": 3599 + }, + { + "epoch": 0.51, + "learning_rate": 9.955563836881898e-06, + "loss": 0.0032, + "reward": -0.2638, + "step": 3609 + }, + { + "epoch": 0.51, + "learning_rate": 9.94294830314191e-06, + "loss": 0.0032, + "reward": -0.2811, + "step": 3619 + }, + { + "epoch": 0.51, + "learning_rate": 9.928768566950635e-06, + "loss": 0.0038, + "reward": -0.3794, + "step": 3629 + }, + { + "epoch": 0.52, + "learning_rate": 9.91302911550412e-06, + "loss": 0.0038, + "reward": -0.3419, + "step": 3639 + }, + { + "epoch": 0.52, + "learning_rate": 9.89573492957235e-06, + "loss": 0.0032, + "reward": -0.31, + "step": 3649 + }, + { + "epoch": 0.52, + "learning_rate": 9.876891481923067e-06, + "loss": 0.0034, + "reward": -0.1604, + "step": 3659 + }, + { + "epoch": 0.52, + "learning_rate": 9.85650473558991e-06, + "loss": 0.0035, + "reward": -0.1379, + "step": 3669 + }, + { + "epoch": 0.52, + "learning_rate": 9.834581141985404e-06, + "loss": 0.0038, + "reward": -0.3531, + "step": 3679 + }, + { + "epoch": 0.52, + "learning_rate": 9.811127638859398e-06, + "loss": 0.0028, + "reward": -0.1161, + "step": 3689 + }, + { + "epoch": 0.52, + "learning_rate": 9.786151648103615e-06, + "loss": 0.0038, + "reward": -0.3628, + "step": 3699 + }, + { + "epoch": 0.53, + "learning_rate": 9.759661073402971e-06, + "loss": 0.0033, + "reward": -0.3243, + "step": 3709 + }, + { + "epoch": 0.53, + "learning_rate": 9.731664297734458e-06, + "loss": 0.0028, + "reward": -0.2481, + "step": 3719 + }, + { + "epoch": 0.53, + "learning_rate": 9.702170180714325e-06, + "loss": 0.0038, + "reward": -0.3179, + "step": 3729 + }, + { + "epoch": 0.53, + "learning_rate": 9.671188055794462e-06, + "loss": 0.0028, + "reward": -0.1725, + "step": 3739 + }, + { + "epoch": 0.53, + "learning_rate": 9.63872772730879e-06, + "loss": 0.003, + "reward": -0.1697, + "step": 3749 + }, + { + "epoch": 0.53, + "learning_rate": 9.604799467370689e-06, + "loss": 0.0035, + "reward": -0.2575, + "step": 3759 + }, + { + "epoch": 0.53, + "learning_rate": 9.569414012622358e-06, + "loss": 0.0043, + "reward": -0.3233, + "step": 3769 + }, + { + "epoch": 0.54, + "learning_rate": 9.532582560837208e-06, + "loss": 0.0031, + "reward": -0.0708, + "step": 3779 + }, + { + "epoch": 0.54, + "learning_rate": 9.494316767376295e-06, + "loss": 0.003, + "reward": -0.2344, + "step": 3789 + }, + { + "epoch": 0.54, + "learning_rate": 9.454628741499978e-06, + "loss": 0.0036, + "reward": -0.0844, + "step": 3799 + }, + { + "epoch": 0.54, + "learning_rate": 9.413531042535916e-06, + "loss": 0.0034, + "reward": -0.2369, + "step": 3809 + }, + { + "epoch": 0.54, + "learning_rate": 9.371036675904671e-06, + "loss": 0.0036, + "reward": -0.3654, + "step": 3819 + }, + { + "epoch": 0.54, + "learning_rate": 9.327159089004098e-06, + "loss": 0.0036, + "reward": -0.2757, + "step": 3829 + }, + { + "epoch": 0.54, + "learning_rate": 9.281912166953932e-06, + "loss": 0.0035, + "reward": -0.3181, + "step": 3839 + }, + { + "epoch": 0.54, + "learning_rate": 9.235310228201784e-06, + "loss": 0.0048, + "reward": -0.3122, + "step": 3849 + }, + { + "epoch": 0.55, + "learning_rate": 9.187368019992095e-06, + "loss": 0.0033, + "reward": -0.2904, + "step": 3859 + }, + { + "epoch": 0.55, + "learning_rate": 9.138100713699312e-06, + "loss": 0.0037, + "reward": -0.1489, + "step": 3869 + }, + { + "epoch": 0.55, + "learning_rate": 9.087523900026905e-06, + "loss": 0.0029, + "reward": -0.2763, + "step": 3879 + }, + { + "epoch": 0.55, + "learning_rate": 9.035653584073675e-06, + "loss": 0.003, + "reward": -0.1622, + "step": 3889 + }, + { + "epoch": 0.55, + "learning_rate": 8.982506180268893e-06, + "loss": 0.0034, + "reward": -0.3107, + "step": 3899 + }, + { + "epoch": 0.55, + "learning_rate": 8.928098507177972e-06, + "loss": 0.0033, + "reward": -0.1224, + "step": 3909 + }, + { + "epoch": 0.55, + "learning_rate": 8.872447782180166e-06, + "loss": 0.0038, + "reward": -0.1105, + "step": 3919 + }, + { + "epoch": 0.56, + "learning_rate": 8.815571616020149e-06, + "loss": 0.0031, + "reward": -0.348, + "step": 3929 + }, + { + "epoch": 0.56, + "learning_rate": 8.757488007235031e-06, + "loss": 0.0035, + "reward": -0.2409, + "step": 3939 + }, + { + "epoch": 0.56, + "learning_rate": 8.698215336458744e-06, + "loss": 0.0033, + "reward": -0.3141, + "step": 3949 + }, + { + "epoch": 0.56, + "learning_rate": 8.637772360605418e-06, + "loss": 0.0034, + "reward": -0.313, + "step": 3959 + }, + { + "epoch": 0.56, + "learning_rate": 8.576178206933775e-06, + "loss": 0.0046, + "reward": -0.4326, + "step": 3969 + }, + { + "epoch": 0.56, + "learning_rate": 8.513452366994239e-06, + "loss": 0.003, + "reward": -0.1198, + "step": 3979 + }, + { + "epoch": 0.56, + "learning_rate": 8.44961469046086e-06, + "loss": 0.0032, + "reward": -0.1191, + "step": 3989 + }, + { + "epoch": 0.57, + "learning_rate": 8.384685378849806e-06, + "loss": 0.0041, + "reward": -0.3557, + "step": 3999 + }, + { + "epoch": 0.57, + "learning_rate": 8.318684979126612e-06, + "loss": 0.0035, + "reward": -0.2939, + "step": 4009 + }, + { + "epoch": 0.57, + "learning_rate": 8.251634377204026e-06, + "loss": 0.0049, + "reward": -0.1952, + "step": 4019 + }, + { + "epoch": 0.57, + "learning_rate": 8.183554791332677e-06, + "loss": 0.0029, + "reward": -0.1551, + "step": 4029 + }, + { + "epoch": 0.57, + "learning_rate": 8.114467765386494e-06, + "loss": 0.0043, + "reward": -0.2539, + "step": 4039 + }, + { + "epoch": 0.57, + "learning_rate": 8.04439516204514e-06, + "loss": 0.0037, + "reward": -0.3849, + "step": 4049 + }, + { + "epoch": 0.57, + "learning_rate": 7.973359155875525e-06, + "loss": 0.0028, + "reward": -0.2593, + "step": 4059 + }, + { + "epoch": 0.58, + "learning_rate": 7.901382226314662e-06, + "loss": 0.0032, + "reward": -0.1569, + "step": 4069 + }, + { + "epoch": 0.58, + "learning_rate": 7.82848715055598e-06, + "loss": 0.0035, + "reward": -0.4049, + "step": 4079 + }, + { + "epoch": 0.58, + "learning_rate": 7.75469699634149e-06, + "loss": 0.0031, + "reward": -0.3131, + "step": 4089 + }, + { + "epoch": 0.58, + "learning_rate": 7.68003511466193e-06, + "loss": 0.0033, + "reward": -0.2798, + "step": 4099 + }, + { + "epoch": 0.58, + "learning_rate": 7.604525132367354e-06, + "loss": 0.0034, + "reward": -0.2349, + "step": 4109 + }, + { + "epoch": 0.58, + "learning_rate": 7.528190944690358e-06, + "loss": 0.0034, + "reward": -0.1358, + "step": 4119 + }, + { + "epoch": 0.58, + "learning_rate": 7.4510567076843945e-06, + "loss": 0.0034, + "reward": -0.1241, + "step": 4129 + }, + { + "epoch": 0.59, + "learning_rate": 7.373146830579598e-06, + "loss": 0.0031, + "reward": -0.0964, + "step": 4139 + }, + { + "epoch": 0.59, + "learning_rate": 7.294485968058401e-06, + "loss": 0.003, + "reward": -0.064, + "step": 4149 + }, + { + "epoch": 0.59, + "learning_rate": 7.2150990124535726e-06, + "loss": 0.0031, + "reward": -0.2023, + "step": 4159 + }, + { + "epoch": 0.59, + "learning_rate": 7.135011085870962e-06, + "loss": 0.0035, + "reward": -0.3227, + "step": 4169 + }, + { + "epoch": 0.59, + "learning_rate": 7.054247532239637e-06, + "loss": 0.003, + "reward": -0.1747, + "step": 4179 + }, + { + "epoch": 0.59, + "learning_rate": 6.9728339092916915e-06, + "loss": 0.003, + "reward": -0.1391, + "step": 4189 + }, + { + "epoch": 0.59, + "learning_rate": 6.890795980474532e-06, + "loss": 0.0029, + "reward": -0.1152, + "step": 4199 + }, + { + "epoch": 0.6, + "learning_rate": 6.808159706797946e-06, + "loss": 0.0027, + "reward": -0.225, + "step": 4209 + }, + { + "epoch": 0.6, + "learning_rate": 6.72495123861877e-06, + "loss": 0.0035, + "reward": -0.107, + "step": 4219 + }, + { + "epoch": 0.6, + "learning_rate": 6.6411969073655014e-06, + "loss": 0.0037, + "reward": -0.213, + "step": 4229 + }, + { + "epoch": 0.6, + "learning_rate": 6.55692321720575e-06, + "loss": 0.0029, + "reward": -0.2639, + "step": 4239 + }, + { + "epoch": 0.6, + "learning_rate": 6.472156836658903e-06, + "loss": 0.0034, + "reward": -0.1981, + "step": 4249 + }, + { + "epoch": 0.6, + "learning_rate": 6.386924590156898e-06, + "loss": 0.0035, + "reward": -0.1908, + "step": 4259 + }, + { + "epoch": 0.6, + "learning_rate": 6.301253449555531e-06, + "loss": 0.0028, + "reward": -0.2391, + "step": 4269 + }, + { + "epoch": 0.61, + "learning_rate": 6.215170525599231e-06, + "loss": 0.0032, + "reward": -0.2446, + "step": 4279 + }, + { + "epoch": 0.61, + "learning_rate": 6.128703059341789e-06, + "loss": 0.0032, + "reward": -0.2266, + "step": 4289 + }, + { + "epoch": 0.61, + "learning_rate": 6.041878413525939e-06, + "loss": 0.0032, + "reward": -0.1362, + "step": 4299 + }, + { + "epoch": 0.61, + "learning_rate": 5.9547240639243184e-06, + "loss": 0.0035, + "reward": -0.2071, + "step": 4309 + }, + { + "epoch": 0.61, + "learning_rate": 5.867267590644787e-06, + "loss": 0.0035, + "reward": -0.2041, + "step": 4319 + }, + { + "epoch": 0.61, + "learning_rate": 5.779536669402611e-06, + "loss": 0.0029, + "reward": -0.2125, + "step": 4329 + }, + { + "epoch": 0.61, + "learning_rate": 5.6915590627625005e-06, + "loss": 0.0033, + "reward": -0.3047, + "step": 4339 + }, + { + "epoch": 0.62, + "learning_rate": 5.60336261135307e-06, + "loss": 0.0028, + "reward": -0.2644, + "step": 4349 + }, + { + "epoch": 0.62, + "learning_rate": 5.514975225056633e-06, + "loss": 0.0032, + "reward": -0.2142, + "step": 4359 + }, + { + "epoch": 0.62, + "learning_rate": 5.4264248741771295e-06, + "loss": 0.0036, + "reward": -0.2406, + "step": 4369 + }, + { + "epoch": 0.62, + "learning_rate": 5.337739580588822e-06, + "loss": 0.0035, + "reward": -0.4047, + "step": 4379 + }, + { + "epoch": 0.62, + "learning_rate": 5.248947408868794e-06, + "loss": 0.0034, + "reward": -0.1619, + "step": 4389 + }, + { + "epoch": 0.62, + "learning_rate": 5.16007645741583e-06, + "loss": 0.0028, + "reward": -0.1479, + "step": 4399 + }, + { + "epoch": 0.62, + "learning_rate": 5.071154849558695e-06, + "loss": 0.0034, + "reward": -0.1027, + "step": 4409 + }, + { + "epoch": 0.63, + "learning_rate": 4.982210724656409e-06, + "loss": 0.0034, + "reward": -0.2996, + "step": 4419 + }, + { + "epoch": 0.63, + "learning_rate": 4.893272229193561e-06, + "loss": 0.0028, + "reward": -0.0919, + "step": 4429 + }, + { + "epoch": 0.63, + "learning_rate": 4.804367507873277e-06, + "loss": 0.003, + "reward": -0.1089, + "step": 4439 + }, + { + "epoch": 0.63, + "learning_rate": 4.715524694710839e-06, + "loss": 0.0031, + "reward": -0.1168, + "step": 4449 + }, + { + "epoch": 0.63, + "learning_rate": 4.626771904130584e-06, + "loss": 0.0034, + "reward": -0.3128, + "step": 4459 + }, + { + "epoch": 0.63, + "learning_rate": 4.538137222069105e-06, + "loss": 0.0041, + "reward": -0.1848, + "step": 4469 + }, + { + "epoch": 0.63, + "learning_rate": 4.449648697087378e-06, + "loss": 0.0032, + "reward": -0.1865, + "step": 4479 + }, + { + "epoch": 0.64, + "learning_rate": 4.361334331494812e-06, + "loss": 0.0027, + "reward": -0.1697, + "step": 4489 + }, + { + "epoch": 0.64, + "learning_rate": 4.2732220724878194e-06, + "loss": 0.0035, + "reward": -0.1667, + "step": 4499 + }, + { + "epoch": 0.64, + "learning_rate": 4.185339803305934e-06, + "loss": 0.0038, + "reward": -0.3111, + "step": 4509 + }, + { + "epoch": 0.64, + "learning_rate": 4.097715334408112e-06, + "loss": 0.003, + "reward": -0.2045, + "step": 4519 + }, + { + "epoch": 0.64, + "learning_rate": 4.010376394672062e-06, + "loss": 0.0031, + "reward": -0.152, + "step": 4529 + }, + { + "epoch": 0.64, + "learning_rate": 3.9233506226194126e-06, + "loss": 0.003, + "reward": -0.2064, + "step": 4539 + }, + { + "epoch": 0.64, + "learning_rate": 3.836665557669496e-06, + "loss": 0.0034, + "reward": -0.2407, + "step": 4549 + }, + { + "epoch": 0.65, + "learning_rate": 3.750348631424402e-06, + "loss": 0.0029, + "reward": -0.1174, + "step": 4559 + }, + { + "epoch": 0.65, + "learning_rate": 3.66442715898827e-06, + "loss": 0.003, + "reward": -0.2606, + "step": 4569 + }, + { + "epoch": 0.65, + "learning_rate": 3.578928330323367e-06, + "loss": 0.003, + "reward": -0.1689, + "step": 4579 + }, + { + "epoch": 0.65, + "learning_rate": 3.493879201645759e-06, + "loss": 0.0028, + "reward": -0.2151, + "step": 4589 + }, + { + "epoch": 0.65, + "learning_rate": 3.409306686863399e-06, + "loss": 0.0029, + "reward": -0.1513, + "step": 4599 + }, + { + "epoch": 0.65, + "learning_rate": 3.3252375490591217e-06, + "loss": 0.0026, + "reward": -0.0821, + "step": 4609 + }, + { + "epoch": 0.65, + "learning_rate": 3.24169839202147e-06, + "loss": 0.0034, + "reward": -0.2608, + "step": 4619 + }, + { + "epoch": 0.66, + "learning_rate": 3.158715651825871e-06, + "loss": 0.0028, + "reward": -0.132, + "step": 4629 + }, + { + "epoch": 0.66, + "learning_rate": 3.076315588468941e-06, + "loss": 0.0028, + "reward": -0.0714, + "step": 4639 + }, + { + "epoch": 0.66, + "learning_rate": 2.9945242775584143e-06, + "loss": 0.0032, + "reward": -0.2108, + "step": 4649 + }, + { + "epoch": 0.66, + "learning_rate": 2.913367602061552e-06, + "loss": 0.0027, + "reward": -0.0474, + "step": 4659 + }, + { + "epoch": 0.66, + "learning_rate": 2.832871244114375e-06, + "loss": 0.0033, + "reward": -0.287, + "step": 4669 + }, + { + "epoch": 0.66, + "learning_rate": 2.753060676894588e-06, + "loss": 0.0029, + "reward": -0.2081, + "step": 4679 + }, + { + "epoch": 0.66, + "learning_rate": 2.6739611565604947e-06, + "loss": 0.0036, + "reward": -0.1504, + "step": 4689 + }, + { + "epoch": 0.67, + "learning_rate": 2.5955977142586946e-06, + "loss": 0.0033, + "reward": -0.2813, + "step": 4699 + }, + { + "epoch": 0.67, + "learning_rate": 2.5179951482029225e-06, + "loss": 0.0029, + "reward": -0.3317, + "step": 4709 + }, + { + "epoch": 0.67, + "learning_rate": 2.4411780158266533e-06, + "loss": 0.0029, + "reward": -0.1715, + "step": 4719 + }, + { + "epoch": 0.67, + "learning_rate": 2.3651706260118184e-06, + "loss": 0.0029, + "reward": -0.1342, + "step": 4729 + }, + { + "epoch": 0.67, + "learning_rate": 2.289997031396286e-06, + "loss": 0.0032, + "reward": -0.0324, + "step": 4739 + }, + { + "epoch": 0.67, + "learning_rate": 2.215681020762313e-06, + "loss": 0.0032, + "reward": -0.1613, + "step": 4749 + }, + { + "epoch": 0.67, + "learning_rate": 2.1422461115086167e-06, + "loss": 0.0027, + "reward": -0.2861, + "step": 4759 + }, + { + "epoch": 0.68, + "learning_rate": 2.069715542208207e-06, + "loss": 0.0026, + "reward": -0.181, + "step": 4769 + }, + { + "epoch": 0.68, + "learning_rate": 1.998112265254541e-06, + "loss": 0.0028, + "reward": -0.1974, + "step": 4779 + }, + { + "epoch": 0.68, + "learning_rate": 1.9274589395981937e-06, + "loss": 0.0036, + "reward": -0.2612, + "step": 4789 + }, + { + "epoch": 0.68, + "learning_rate": 1.8577779235764249e-06, + "loss": 0.0031, + "reward": -0.1949, + "step": 4799 + }, + { + "epoch": 0.68, + "learning_rate": 1.7890912678378392e-06, + "loss": 0.0033, + "reward": -0.1398, + "step": 4809 + }, + { + "epoch": 0.68, + "learning_rate": 1.7214207083644098e-06, + "loss": 0.0032, + "reward": -0.1068, + "step": 4819 + }, + { + "epoch": 0.68, + "learning_rate": 1.6547876595931444e-06, + "loss": 0.0028, + "reward": -0.2427, + "step": 4829 + }, + { + "epoch": 0.69, + "learning_rate": 1.5892132076394151e-06, + "loss": 0.0031, + "reward": -0.0524, + "step": 4839 + }, + { + "epoch": 0.69, + "learning_rate": 1.524718103624252e-06, + "loss": 0.0029, + "reward": -0.1146, + "step": 4849 + }, + { + "epoch": 0.69, + "learning_rate": 1.4613227571076138e-06, + "loss": 0.0029, + "reward": -0.1041, + "step": 4859 + }, + { + "epoch": 0.69, + "learning_rate": 1.3990472296297808e-06, + "loss": 0.0025, + "reward": -0.2616, + "step": 4869 + }, + { + "epoch": 0.69, + "learning_rate": 1.3379112283628081e-06, + "loss": 0.0029, + "reward": -0.187, + "step": 4879 + }, + { + "epoch": 0.69, + "learning_rate": 1.2779340998742185e-06, + "loss": 0.0032, + "reward": -0.1955, + "step": 4889 + }, + { + "epoch": 0.69, + "learning_rate": 1.219134824004704e-06, + "loss": 0.0028, + "reward": -0.106, + "step": 4899 + }, + { + "epoch": 0.7, + "learning_rate": 1.16153200786198e-06, + "loss": 0.0032, + "reward": -0.2001, + "step": 4909 + }, + { + "epoch": 0.7, + "learning_rate": 1.1051438799324999e-06, + "loss": 0.0029, + "reward": -0.1302, + "step": 4919 + }, + { + "epoch": 0.7, + "learning_rate": 1.0499882843130487e-06, + "loss": 0.0032, + "reward": -0.2308, + "step": 4929 + }, + { + "epoch": 0.7, + "learning_rate": 9.96082675063948e-07, + "loss": 0.0028, + "reward": -0.2366, + "step": 4939 + }, + { + "epoch": 0.7, + "learning_rate": 9.43444110685714e-07, + "loss": 0.003, + "reward": -0.1516, + "step": 4949 + }, + { + "epoch": 0.7, + "learning_rate": 8.920892487208343e-07, + "loss": 0.0034, + "reward": 0.0169, + "step": 4959 + }, + { + "epoch": 0.7, + "learning_rate": 8.420343404825132e-07, + "loss": 0.0026, + "reward": -0.0979, + "step": 4969 + }, + { + "epoch": 0.7, + "learning_rate": 7.932952259118776e-07, + "loss": 0.003, + "reward": -0.1379, + "step": 4979 + }, + { + "epoch": 0.71, + "learning_rate": 7.458873285654489e-07, + "loss": 0.0035, + "reward": -0.0396, + "step": 4989 + }, + { + "epoch": 0.71, + "learning_rate": 6.998256507343016e-07, + "loss": 0.0027, + "reward": 0.0041, + "step": 4999 + }, + { + "epoch": 0.71, + "learning_rate": 6.551247686965872e-07, + "loss": 0.0034, + "reward": -0.1662, + "step": 5009 + }, + { + "epoch": 0.71, + "learning_rate": 6.117988281048626e-07, + "loss": 0.0032, + "reward": -0.1413, + "step": 5019 + }, + { + "epoch": 0.71, + "learning_rate": 5.698615395096485e-07, + "loss": 0.0029, + "reward": -0.2091, + "step": 5029 + }, + { + "epoch": 0.71, + "learning_rate": 5.293261740207456e-07, + "loss": 0.0028, + "reward": -0.2433, + "step": 5039 + }, + { + "epoch": 0.71, + "learning_rate": 4.902055591075355e-07, + "loss": 0.0031, + "reward": -0.2965, + "step": 5049 + }, + { + "epoch": 0.72, + "learning_rate": 4.525120745397493e-07, + "loss": 0.0029, + "reward": -0.1276, + "step": 5059 + }, + { + "epoch": 0.72, + "learning_rate": 4.1625764846984276e-07, + "loss": 0.0031, + "reward": -0.1481, + "step": 5069 + }, + { + "epoch": 0.72, + "learning_rate": 3.814537536583318e-07, + "loss": 0.0028, + "reward": -0.1388, + "step": 5079 + }, + { + "epoch": 0.72, + "learning_rate": 3.481114038432176e-07, + "loss": 0.003, + "reward": -0.2624, + "step": 5089 + }, + { + "epoch": 0.72, + "learning_rate": 3.1624115025468695e-07, + "loss": 0.0029, + "reward": -0.0321, + "step": 5099 + }, + { + "epoch": 0.72, + "learning_rate": 2.8585307827613764e-07, + "loss": 0.0029, + "reward": -0.2161, + "step": 5109 + }, + { + "epoch": 0.72, + "learning_rate": 2.569568042526721e-07, + "loss": 0.0035, + "reward": -0.2493, + "step": 5119 + }, + { + "epoch": 0.73, + "learning_rate": 2.2956147244796946e-07, + "loss": 0.0031, + "reward": -0.1123, + "step": 5129 + }, + { + "epoch": 0.73, + "learning_rate": 2.0367575215059222e-07, + "loss": 0.0031, + "reward": -0.1892, + "step": 5139 + }, + { + "epoch": 0.73, + "learning_rate": 1.7930783493055936e-07, + "loss": 0.0031, + "reward": -0.3653, + "step": 5149 + }, + { + "epoch": 0.73, + "learning_rate": 1.5646543204712595e-07, + "loss": 0.003, + "reward": -0.1532, + "step": 5159 + }, + { + "epoch": 0.73, + "learning_rate": 1.3515577200853946e-07, + "loss": 0.0031, + "reward": -0.2271, + "step": 5169 + }, + { + "epoch": 0.73, + "learning_rate": 1.1538559828457586e-07, + "loss": 0.0033, + "reward": -0.1938, + "step": 5179 + }, + { + "epoch": 0.73, + "learning_rate": 9.716116717254698e-08, + "loss": 0.003, + "reward": -0.2875, + "step": 5189 + }, + { + "epoch": 0.74, + "learning_rate": 8.048824581750325e-08, + "loss": 0.0032, + "reward": -0.1349, + "step": 5199 + }, + { + "epoch": 0.74, + "learning_rate": 6.537211038719571e-08, + "loss": 0.0027, + "reward": -0.1755, + "step": 5209 + }, + { + "epoch": 0.74, + "learning_rate": 5.1817544402442686e-08, + "loss": 0.0033, + "reward": -0.1694, + "step": 5219 + }, + { + "epoch": 0.74, + "learning_rate": 3.9828837223365166e-08, + "loss": 0.0027, + "reward": -0.1913, + "step": 5229 + }, + { + "epoch": 0.74, + "learning_rate": 2.9409782692019218e-08, + "loss": 0.0032, + "reward": -0.2301, + "step": 5239 + }, + { + "epoch": 0.74, + "learning_rate": 2.056367793183134e-08, + "loss": 0.0032, + "reward": -0.3049, + "step": 5249 + }, + { + "epoch": 0.74, + "learning_rate": 1.3293322304213652e-08, + "loss": 0.0034, + "reward": -0.2132, + "step": 5259 + }, + { + "epoch": 0.75, + "learning_rate": 7.601016522708616e-09, + "loss": 0.0031, + "reward": -0.2705, + "step": 5269 + }, + { + "epoch": 0.75, + "learning_rate": 3.4885619249203086e-09, + "loss": 0.0031, + "reward": -0.1178, + "step": 5279 + }, + { + "epoch": 0.75, + "learning_rate": 9.572599024820773e-10, + "loss": 0.0031, + "reward": -0.1919, + "step": 5289 + }, + { + "epoch": 0.75, + "learning_rate": 7.911489227074853e-12, + "loss": 0.0029, + "reward": -0.0784, + "step": 5299 + }, + { + "epoch": 0.75, + "learning_rate": 6.408171077015856e-10, + "loss": 0.0031, + "reward": -0.1285, + "step": 5309 + }, + { + "epoch": 0.75, + "learning_rate": 2.8557764740955172e-09, + "loss": 0.0031, + "reward": -0.1184, + "step": 5319 + }, + { + "epoch": 0.75, + "learning_rate": 6.652088661621703e-09, + "loss": 0.003, + "reward": -0.2125, + "step": 5329 + }, + { + "epoch": 0.76, + "learning_rate": 1.2028552322327358e-08, + "loss": 0.004, + "reward": -0.202, + "step": 5339 + }, + { + "epoch": 0.76, + "learning_rate": 1.898346606725887e-08, + "loss": 0.0032, + "reward": -0.206, + "step": 5349 + }, + { + "epoch": 0.76, + "learning_rate": 2.7514629004871673e-08, + "loss": 0.0033, + "reward": -0.2027, + "step": 5359 + }, + { + "epoch": 0.76, + "learning_rate": 3.761934143750256e-08, + "loss": 0.0044, + "reward": -0.2893, + "step": 5369 + }, + { + "epoch": 0.76, + "learning_rate": 4.9294405715696324e-08, + "loss": 0.0032, + "reward": -0.1786, + "step": 5379 + }, + { + "epoch": 0.76, + "learning_rate": 6.253612725009962e-08, + "loss": 0.0033, + "reward": -0.26, + "step": 5389 + }, + { + "epoch": 0.76, + "learning_rate": 7.734031568062683e-08, + "loss": 0.0024, + "reward": -0.2568, + "step": 5399 + }, + { + "epoch": 0.77, + "learning_rate": 9.370228620249778e-08, + "loss": 0.0037, + "reward": -0.1439, + "step": 5409 + }, + { + "epoch": 0.77, + "learning_rate": 1.116168610487578e-07, + "loss": 0.0028, + "reward": -0.2807, + "step": 5419 + }, + { + "epoch": 0.77, + "learning_rate": 1.3107837112877664e-07, + "loss": 0.0032, + "reward": -0.2143, + "step": 5429 + }, + { + "epoch": 0.77, + "learning_rate": 1.5208065782225667e-07, + "loss": 0.0031, + "reward": -0.2846, + "step": 5439 + }, + { + "epoch": 0.77, + "learning_rate": 1.7461707492811786e-07, + "loss": 0.0032, + "reward": -0.2704, + "step": 5449 + }, + { + "epoch": 0.77, + "learning_rate": 1.9868049076771478e-07, + "loss": 0.0035, + "reward": -0.2247, + "step": 5459 + }, + { + "epoch": 0.77, + "learning_rate": 2.2426329044164808e-07, + "loss": 0.0032, + "reward": -0.1316, + "step": 5469 + }, + { + "epoch": 0.78, + "learning_rate": 2.5135737823952457e-07, + "loss": 0.0033, + "reward": -0.1427, + "step": 5479 + }, + { + "epoch": 0.78, + "learning_rate": 2.7995418020185016e-07, + "loss": 0.0029, + "reward": -0.2073, + "step": 5489 + }, + { + "epoch": 0.78, + "learning_rate": 3.100446468332596e-07, + "loss": 0.0026, + "reward": -0.1949, + "step": 5499 + }, + { + "epoch": 0.78, + "learning_rate": 3.41619255966264e-07, + "loss": 0.0028, + "reward": -0.2821, + "step": 5509 + }, + { + "epoch": 0.78, + "learning_rate": 3.746680157745258e-07, + "loss": 0.0029, + "reward": -0.1413, + "step": 5519 + }, + { + "epoch": 0.78, + "learning_rate": 4.091804679348144e-07, + "loss": 0.0032, + "reward": -0.2282, + "step": 5529 + }, + { + "epoch": 0.78, + "learning_rate": 4.451456909365265e-07, + "loss": 0.003, + "reward": -0.1473, + "step": 5539 + }, + { + "epoch": 0.79, + "learning_rate": 4.825523035378365e-07, + "loss": 0.0032, + "reward": -0.1949, + "step": 5549 + }, + { + "epoch": 0.79, + "learning_rate": 5.213884683672954e-07, + "loss": 0.0041, + "reward": -0.0118, + "step": 5559 + }, + { + "epoch": 0.79, + "learning_rate": 5.61641895669785e-07, + "loss": 0.0031, + "reward": -0.1958, + "step": 5569 + }, + { + "epoch": 0.79, + "learning_rate": 6.03299847195613e-07, + "loss": 0.003, + "reward": -0.0907, + "step": 5579 + }, + { + "epoch": 0.79, + "learning_rate": 6.46349140231578e-07, + "loss": 0.0032, + "reward": -0.1633, + "step": 5589 + }, + { + "epoch": 0.79, + "learning_rate": 6.907761517726225e-07, + "loss": 0.0037, + "reward": -0.3335, + "step": 5599 + }, + { + "epoch": 0.79, + "learning_rate": 7.365668228328832e-07, + "loss": 0.0032, + "reward": -0.2729, + "step": 5609 + }, + { + "epoch": 0.8, + "learning_rate": 7.837066628946427e-07, + "loss": 0.004, + "reward": -0.2201, + "step": 5619 + }, + { + "epoch": 0.8, + "learning_rate": 8.321807544939037e-07, + "loss": 0.0035, + "reward": -0.1243, + "step": 5629 + }, + { + "epoch": 0.8, + "learning_rate": 8.819737579410198e-07, + "loss": 0.003, + "reward": -0.1845, + "step": 5639 + }, + { + "epoch": 0.8, + "learning_rate": 9.33069916174974e-07, + "loss": 0.0032, + "reward": -0.2037, + "step": 5649 + }, + { + "epoch": 0.8, + "learning_rate": 9.854530597496953e-07, + "loss": 0.0031, + "reward": -0.0922, + "step": 5659 + }, + { + "epoch": 0.8, + "learning_rate": 1.039106611950943e-06, + "loss": 0.0025, + "reward": -0.2618, + "step": 5669 + }, + { + "epoch": 0.8, + "learning_rate": 1.0940135940419828e-06, + "loss": 0.003, + "reward": -0.1229, + "step": 5679 + }, + { + "epoch": 0.81, + "learning_rate": 1.1501566306365758e-06, + "loss": 0.0029, + "reward": -0.0647, + "step": 5689 + }, + { + "epoch": 0.81, + "learning_rate": 1.2075179551973986e-06, + "loss": 0.003, + "reward": -0.1913, + "step": 5699 + }, + { + "epoch": 0.81, + "learning_rate": 1.2660794156583233e-06, + "loss": 0.0028, + "reward": -0.1541, + "step": 5709 + }, + { + "epoch": 0.81, + "learning_rate": 1.3258224801686503e-06, + "loss": 0.0033, + "reward": -0.1554, + "step": 5719 + }, + { + "epoch": 0.81, + "learning_rate": 1.3867282429575152e-06, + "loss": 0.0041, + "reward": -0.3137, + "step": 5729 + }, + { + "epoch": 0.81, + "learning_rate": 1.4487774303166875e-06, + "loss": 0.0033, + "reward": -0.2465, + "step": 5739 + }, + { + "epoch": 0.81, + "learning_rate": 1.511950406699712e-06, + "loss": 0.0038, + "reward": -0.2697, + "step": 5749 + }, + { + "epoch": 0.82, + "learning_rate": 1.576227180935655e-06, + "loss": 0.0032, + "reward": -0.155, + "step": 5759 + }, + { + "epoch": 0.82, + "learning_rate": 1.641587412555281e-06, + "loss": 0.0026, + "reward": -0.128, + "step": 5769 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080104182278716e-06, + "loss": 0.0036, + "reward": -0.1322, + "step": 5779 + }, + { + "epoch": 0.82, + "learning_rate": 1.7754751783064622e-06, + "loss": 0.0036, + "reward": -0.2405, + "step": 5789 + }, + { + "epoch": 0.82, + "learning_rate": 1.8439603434795516e-06, + "loss": 0.0032, + "reward": -0.1742, + "step": 5799 + }, + { + "epoch": 0.82, + "learning_rate": 1.9134442415270926e-06, + "loss": 0.003, + "reward": -0.1415, + "step": 5809 + }, + { + "epoch": 0.82, + "learning_rate": 1.983904884178742e-06, + "loss": 0.0027, + "reward": -0.3485, + "step": 5819 + }, + { + "epoch": 0.83, + "learning_rate": 2.0553199740720214e-06, + "loss": 0.0033, + "reward": -0.2301, + "step": 5829 + }, + { + "epoch": 0.83, + "learning_rate": 2.1276669118084043e-06, + "loss": 0.0038, + "reward": -0.419, + "step": 5839 + }, + { + "epoch": 0.83, + "learning_rate": 2.200922803104868e-06, + "loss": 0.0028, + "reward": -0.1832, + "step": 5849 + }, + { + "epoch": 0.83, + "learning_rate": 2.2750644660388675e-06, + "loss": 0.0028, + "reward": -0.1299, + "step": 5859 + }, + { + "epoch": 0.83, + "learning_rate": 2.3500684383842605e-06, + "loss": 0.0027, + "reward": -0.0986, + "step": 5869 + }, + { + "epoch": 0.83, + "learning_rate": 2.4259109850359695e-06, + "loss": 0.0027, + "reward": -0.1309, + "step": 5879 + }, + { + "epoch": 0.83, + "learning_rate": 2.502568105520961e-06, + "loss": 0.0034, + "reward": -0.1672, + "step": 5889 + }, + { + "epoch": 0.84, + "learning_rate": 2.580015541593277e-06, + "loss": 0.0031, + "reward": -0.1751, + "step": 5899 + }, + { + "epoch": 0.84, + "learning_rate": 2.6582287849105274e-06, + "loss": 0.0031, + "reward": -0.2151, + "step": 5909 + }, + { + "epoch": 0.84, + "learning_rate": 2.737183084789651e-06, + "loss": 0.0029, + "reward": -0.1455, + "step": 5919 + }, + { + "epoch": 0.84, + "learning_rate": 2.816853456039244e-06, + "loss": 0.0026, + "reward": -0.1059, + "step": 5929 + }, + { + "epoch": 0.84, + "learning_rate": 2.8972146868661828e-06, + "loss": 0.0028, + "reward": -0.1925, + "step": 5939 + }, + { + "epoch": 0.84, + "learning_rate": 2.9782413468539417e-06, + "loss": 0.0028, + "reward": -0.3239, + "step": 5949 + }, + { + "epoch": 0.84, + "learning_rate": 3.0599077950100608e-06, + "loss": 0.0039, + "reward": -0.2807, + "step": 5959 + }, + { + "epoch": 0.85, + "learning_rate": 3.1421881878802864e-06, + "loss": 0.0028, + "reward": -0.2573, + "step": 5969 + }, + { + "epoch": 0.85, + "learning_rate": 3.225056487726732e-06, + "loss": 0.003, + "reward": -0.2115, + "step": 5979 + }, + { + "epoch": 0.85, + "learning_rate": 3.308486470767613e-06, + "loss": 0.0028, + "reward": -0.1847, + "step": 5989 + }, + { + "epoch": 0.85, + "learning_rate": 3.3924517354757315e-06, + "loss": 0.0027, + "reward": -0.1512, + "step": 5999 + }, + { + "epoch": 0.85, + "learning_rate": 3.476925710933339e-06, + "loss": 0.0031, + "reward": -0.0941, + "step": 6009 + }, + { + "epoch": 0.85, + "learning_rate": 3.5618816652404714e-06, + "loss": 0.0033, + "reward": -0.2708, + "step": 6019 + }, + { + "epoch": 0.85, + "learning_rate": 3.6472927139743546e-06, + "loss": 0.0024, + "reward": -0.1351, + "step": 6029 + }, + { + "epoch": 0.86, + "learning_rate": 3.7331318286969787e-06, + "loss": 0.003, + "reward": -0.2288, + "step": 6039 + }, + { + "epoch": 0.86, + "learning_rate": 3.819371845508301e-06, + "loss": 0.0025, + "reward": -0.1268, + "step": 6049 + }, + { + "epoch": 0.86, + "learning_rate": 3.9059854736422616e-06, + "loss": 0.0035, + "reward": -0.1775, + "step": 6059 + }, + { + "epoch": 0.86, + "learning_rate": 3.992945304103046e-06, + "loss": 0.0029, + "reward": -0.1164, + "step": 6069 + }, + { + "epoch": 0.86, + "learning_rate": 4.080223818338627e-06, + "loss": 0.003, + "reward": -0.3306, + "step": 6079 + }, + { + "epoch": 0.86, + "learning_rate": 4.16779339694911e-06, + "loss": 0.0029, + "reward": -0.124, + "step": 6089 + }, + { + "epoch": 0.86, + "learning_rate": 4.25562632842687e-06, + "loss": 0.0029, + "reward": -0.1823, + "step": 6099 + }, + { + "epoch": 0.86, + "learning_rate": 4.343694817925945e-06, + "loss": 0.0026, + "reward": -0.2144, + "step": 6109 + }, + { + "epoch": 0.87, + "learning_rate": 4.4319709960577205e-06, + "loss": 0.0028, + "reward": -0.0664, + "step": 6119 + }, + { + "epoch": 0.87, + "learning_rate": 4.520426927710255e-06, + "loss": 0.0027, + "reward": -0.1177, + "step": 6129 + }, + { + "epoch": 0.87, + "learning_rate": 4.609034620888349e-06, + "loss": 0.0034, + "reward": -0.135, + "step": 6139 + }, + { + "epoch": 0.87, + "learning_rate": 4.697766035571671e-06, + "loss": 0.0043, + "reward": -0.3131, + "step": 6149 + }, + { + "epoch": 0.87, + "learning_rate": 4.786593092588086e-06, + "loss": 0.0024, + "reward": -0.234, + "step": 6159 + }, + { + "epoch": 0.87, + "learning_rate": 4.875487682499278e-06, + "loss": 0.0027, + "reward": -0.0573, + "step": 6169 + }, + { + "epoch": 0.87, + "learning_rate": 4.96442167449609e-06, + "loss": 0.0034, + "reward": -0.1771, + "step": 6179 + }, + { + "epoch": 0.88, + "learning_rate": 5.053366925300511e-06, + "loss": 0.0028, + "reward": -0.1481, + "step": 6189 + }, + { + "epoch": 0.88, + "learning_rate": 5.142295288071675e-06, + "loss": 0.0041, + "reward": -0.2635, + "step": 6199 + }, + { + "epoch": 0.88, + "learning_rate": 5.2311786213129315e-06, + "loss": 0.003, + "reward": -0.1914, + "step": 6209 + }, + { + "epoch": 0.88, + "learning_rate": 5.319988797777316e-06, + "loss": 0.0027, + "reward": -0.181, + "step": 6219 + }, + { + "epoch": 0.88, + "learning_rate": 5.408697713368388e-06, + "loss": 0.0028, + "reward": -0.1659, + "step": 6229 + }, + { + "epoch": 0.88, + "learning_rate": 5.4972772960338784e-06, + "loss": 0.0024, + "reward": -0.0837, + "step": 6239 + }, + { + "epoch": 0.88, + "learning_rate": 5.585699514649057e-06, + "loss": 0.003, + "reward": -0.1156, + "step": 6249 + }, + { + "epoch": 0.89, + "learning_rate": 5.6739363878872754e-06, + "loss": 0.003, + "reward": -0.1918, + "step": 6259 + }, + { + "epoch": 0.89, + "learning_rate": 5.761959993074669e-06, + "loss": 0.0027, + "reward": -0.2119, + "step": 6269 + }, + { + "epoch": 0.89, + "learning_rate": 5.84974247502633e-06, + "loss": 0.0031, + "reward": -0.1654, + "step": 6279 + }, + { + "epoch": 0.89, + "learning_rate": 5.93725605486109e-06, + "loss": 0.0029, + "reward": -0.1048, + "step": 6289 + }, + { + "epoch": 0.89, + "learning_rate": 6.024473038792242e-06, + "loss": 0.0029, + "reward": -0.1743, + "step": 6299 + }, + { + "epoch": 0.89, + "learning_rate": 6.1113658268912065e-06, + "loss": 0.0028, + "reward": -0.1883, + "step": 6309 + }, + { + "epoch": 0.89, + "learning_rate": 6.197906921821632e-06, + "loss": 0.0027, + "reward": -0.1351, + "step": 6319 + }, + { + "epoch": 0.9, + "learning_rate": 6.284068937540894e-06, + "loss": 0.0027, + "reward": -0.1687, + "step": 6329 + }, + { + "epoch": 0.9, + "learning_rate": 6.369824607966508e-06, + "loss": 0.0028, + "reward": -0.1027, + "step": 6339 + }, + { + "epoch": 0.9, + "learning_rate": 6.455146795604479e-06, + "loss": 0.0028, + "reward": -0.0773, + "step": 6349 + }, + { + "epoch": 0.9, + "learning_rate": 6.5400085001370186e-06, + "loss": 0.0025, + "reward": -0.2412, + "step": 6359 + }, + { + "epoch": 0.9, + "learning_rate": 6.624382866966794e-06, + "loss": 0.003, + "reward": -0.1633, + "step": 6369 + }, + { + "epoch": 0.9, + "learning_rate": 6.708243195715136e-06, + "loss": 0.0026, + "reward": -0.2322, + "step": 6379 + }, + { + "epoch": 0.9, + "learning_rate": 6.791562948671414e-06, + "loss": 0.0032, + "reward": -0.1261, + "step": 6389 + }, + { + "epoch": 0.91, + "learning_rate": 6.874315759190886e-06, + "loss": 0.0025, + "reward": -0.1441, + "step": 6399 + }, + { + "epoch": 0.91, + "learning_rate": 6.956475440038507e-06, + "loss": 0.0031, + "reward": -0.0489, + "step": 6409 + }, + { + "epoch": 0.91, + "learning_rate": 7.038015991675885e-06, + "loss": 0.0028, + "reward": -0.1033, + "step": 6419 + }, + { + "epoch": 0.91, + "learning_rate": 7.118911610488885e-06, + "loss": 0.0027, + "reward": -0.2106, + "step": 6429 + }, + { + "epoch": 0.91, + "learning_rate": 7.199136696953178e-06, + "loss": 0.0036, + "reward": -0.0478, + "step": 6439 + }, + { + "epoch": 0.91, + "learning_rate": 7.2786658637353125e-06, + "loss": 0.003, + "reward": -0.218, + "step": 6449 + }, + { + "epoch": 0.91, + "learning_rate": 7.357473943726493e-06, + "loss": 0.0026, + "reward": -0.0883, + "step": 6459 + }, + { + "epoch": 0.92, + "learning_rate": 7.435535998006814e-06, + "loss": 0.0034, + "reward": -0.2207, + "step": 6469 + }, + { + "epoch": 0.92, + "learning_rate": 7.512827323737152e-06, + "loss": 0.0033, + "reward": -0.192, + "step": 6479 + }, + { + "epoch": 0.92, + "learning_rate": 7.589323461976461e-06, + "loss": 0.0028, + "reward": -0.1123, + "step": 6489 + }, + { + "epoch": 0.92, + "learning_rate": 7.665000205421812e-06, + "loss": 0.0029, + "reward": -0.2671, + "step": 6499 + }, + { + "epoch": 0.92, + "learning_rate": 7.739833606068832e-06, + "loss": 0.0031, + "reward": -0.1165, + "step": 6509 + }, + { + "epoch": 0.92, + "learning_rate": 7.81379998279006e-06, + "loss": 0.0029, + "reward": -0.1378, + "step": 6519 + }, + { + "epoch": 0.92, + "learning_rate": 7.88687592882892e-06, + "loss": 0.0033, + "reward": -0.1337, + "step": 6529 + }, + { + "epoch": 0.93, + "learning_rate": 7.959038319206758e-06, + "loss": 0.0027, + "reward": -0.2007, + "step": 6539 + }, + { + "epoch": 0.93, + "learning_rate": 8.03026431804083e-06, + "loss": 0.0026, + "reward": -0.1243, + "step": 6549 + }, + { + "epoch": 0.93, + "learning_rate": 8.100531385770696e-06, + "loss": 0.0029, + "reward": -0.0918, + "step": 6559 + }, + { + "epoch": 0.93, + "learning_rate": 8.169817286290935e-06, + "loss": 0.0029, + "reward": -0.0355, + "step": 6569 + }, + { + "epoch": 0.93, + "learning_rate": 8.238100093987765e-06, + "loss": 0.0027, + "reward": -0.2479, + "step": 6579 + }, + { + "epoch": 0.93, + "learning_rate": 8.305358200677449e-06, + "loss": 0.0026, + "reward": -0.074, + "step": 6589 + }, + { + "epoch": 0.93, + "learning_rate": 8.371570322444209e-06, + "loss": 0.0029, + "reward": -0.0884, + "step": 6599 + }, + { + "epoch": 0.94, + "learning_rate": 8.436715506375557e-06, + "loss": 0.0028, + "reward": -0.1674, + "step": 6609 + }, + { + "epoch": 0.94, + "learning_rate": 8.500773137192906e-06, + "loss": 0.0035, + "reward": -0.2794, + "step": 6619 + }, + { + "epoch": 0.94, + "learning_rate": 8.56372294377524e-06, + "loss": 0.0027, + "reward": -0.1072, + "step": 6629 + }, + { + "epoch": 0.94, + "learning_rate": 8.625545005574002e-06, + "loss": 0.0023, + "reward": -0.0992, + "step": 6639 + }, + { + "epoch": 0.94, + "learning_rate": 8.686219758916918e-06, + "loss": 0.0029, + "reward": -0.1256, + "step": 6649 + }, + { + "epoch": 0.94, + "learning_rate": 8.745728003198991e-06, + "loss": 0.0039, + "reward": 0.0413, + "step": 6659 + }, + { + "epoch": 0.94, + "learning_rate": 8.804050906958537e-06, + "loss": 0.0026, + "reward": -0.1593, + "step": 6669 + }, + { + "epoch": 0.95, + "learning_rate": 8.861170013836436e-06, + "loss": 0.0031, + "reward": -0.0352, + "step": 6679 + }, + { + "epoch": 0.95, + "learning_rate": 8.917067248416647e-06, + "loss": 0.003, + "reward": -0.0722, + "step": 6689 + }, + { + "epoch": 0.95, + "learning_rate": 8.971724921946235e-06, + "loss": 0.0027, + "reward": -0.1898, + "step": 6699 + }, + { + "epoch": 0.95, + "learning_rate": 9.025125737932962e-06, + "loss": 0.003, + "reward": -0.1166, + "step": 6709 + }, + { + "epoch": 0.95, + "learning_rate": 9.077252797618818e-06, + "loss": 0.0024, + "reward": 0.0003, + "step": 6719 + }, + { + "epoch": 0.95, + "learning_rate": 9.128089605327627e-06, + "loss": 0.0028, + "reward": -0.0084, + "step": 6729 + }, + { + "epoch": 0.95, + "learning_rate": 9.177620073685139e-06, + "loss": 0.0025, + "reward": 0.0006, + "step": 6739 + }, + { + "epoch": 0.96, + "learning_rate": 9.225828528709911e-06, + "loss": 0.0025, + "reward": -0.0565, + "step": 6749 + }, + { + "epoch": 0.96, + "learning_rate": 9.27269971477334e-06, + "loss": 0.0027, + "reward": -0.2262, + "step": 6759 + }, + { + "epoch": 0.96, + "learning_rate": 9.318218799427321e-06, + "loss": 0.0024, + "reward": -0.2918, + "step": 6769 + }, + { + "epoch": 0.96, + "learning_rate": 9.362371378098033e-06, + "loss": 0.0027, + "reward": -0.1157, + "step": 6779 + }, + { + "epoch": 0.96, + "learning_rate": 9.405143478644232e-06, + "loss": 0.0031, + "reward": -0.1187, + "step": 6789 + }, + { + "epoch": 0.96, + "learning_rate": 9.446521565778804e-06, + "loss": 0.0028, + "reward": -0.0971, + "step": 6799 + }, + { + "epoch": 0.96, + "learning_rate": 9.486492545351985e-06, + "loss": 0.0029, + "reward": -0.0164, + "step": 6809 + }, + { + "epoch": 0.97, + "learning_rate": 9.525043768495047e-06, + "loss": 0.0029, + "reward": -0.2, + "step": 6819 + }, + { + "epoch": 0.97, + "learning_rate": 9.562163035623038e-06, + "loss": 0.0022, + "reward": 0.0569, + "step": 6829 + }, + { + "epoch": 0.97, + "learning_rate": 9.597838600295355e-06, + "loss": 0.0023, + "reward": -0.163, + "step": 6839 + }, + { + "epoch": 0.97, + "learning_rate": 9.632059172932935e-06, + "loss": 0.0027, + "reward": -0.1407, + "step": 6849 + }, + { + "epoch": 0.97, + "learning_rate": 9.664813924390828e-06, + "loss": 0.0026, + "reward": -0.1893, + "step": 6859 + }, + { + "epoch": 0.97, + "learning_rate": 9.696092489385132e-06, + "loss": 0.0027, + "reward": -0.0518, + "step": 6869 + }, + { + "epoch": 0.97, + "learning_rate": 9.72588496977306e-06, + "loss": 0.0026, + "reward": -0.1236, + "step": 6879 + }, + { + "epoch": 0.98, + "learning_rate": 9.754181937685261e-06, + "loss": 0.0026, + "reward": -0.2622, + "step": 6889 + }, + { + "epoch": 0.98, + "learning_rate": 9.780974438509254e-06, + "loss": 0.0025, + "reward": -0.1576, + "step": 6899 + }, + { + "epoch": 0.98, + "learning_rate": 9.80625399372313e-06, + "loss": 0.0036, + "reward": -0.0548, + "step": 6909 + }, + { + "epoch": 0.98, + "learning_rate": 9.8300126035786e-06, + "loss": 0.0037, + "reward": -0.219, + "step": 6919 + }, + { + "epoch": 0.98, + "learning_rate": 9.852242749632524e-06, + "loss": 0.0028, + "reward": -0.0597, + "step": 6929 + }, + { + "epoch": 0.98, + "learning_rate": 9.872937397126121e-06, + "loss": 0.0024, + "reward": -0.133, + "step": 6939 + }, + { + "epoch": 0.98, + "learning_rate": 9.89208999721115e-06, + "loss": 0.0027, + "reward": -0.0708, + "step": 6949 + }, + { + "epoch": 0.99, + "learning_rate": 9.909694489022273e-06, + "loss": 0.0026, + "reward": -0.0812, + "step": 6959 + }, + { + "epoch": 0.99, + "learning_rate": 9.92574530159505e-06, + "loss": 0.0031, + "reward": 0.0002, + "step": 6969 + }, + { + "epoch": 0.99, + "learning_rate": 9.940237355628861e-06, + "loss": 0.003, + "reward": 0.0289, + "step": 6979 + }, + { + "epoch": 0.99, + "learning_rate": 9.95316606509427e-06, + "loss": 0.0029, + "reward": -0.0353, + "step": 6989 + }, + { + "epoch": 0.99, + "learning_rate": 9.964527338684262e-06, + "loss": 0.0023, + "reward": -0.0618, + "step": 6999 + }, + { + "epoch": 0.99, + "learning_rate": 9.974317581108963e-06, + "loss": 0.003, + "reward": -0.1512, + "step": 7009 + }, + { + "epoch": 0.99, + "learning_rate": 9.98253369423336e-06, + "loss": 0.0032, + "reward": 0.0394, + "step": 7019 + }, + { + "epoch": 1.0, + "learning_rate": 9.989173078057715e-06, + "loss": 0.0027, + "reward": -0.081, + "step": 7029 + }, + { + "epoch": 1.0, + "learning_rate": 9.99423363154034e-06, + "loss": 0.0028, + "reward": -0.0309, + "step": 7039 + }, + { + "epoch": 1.0, + "learning_rate": 9.99771375326247e-06, + "loss": 0.0025, + "reward": -0.1167, + "step": 7049 + }, + { + "epoch": 1.0, + "learning_rate": 9.999612341935039e-06, + "loss": 0.0024, + "reward": -0.0893, + "step": 7059 + } + ], + "max_steps": 7063, + "num_train_epochs": 1.0, + "total_flos": 0, + "trial_name": null, + "trial_params": null +} diff --git a/ppo-lora/training_args.bin b/ppo-lora/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..684a2089f53ed437a099eb02bb62cc1ce00d3664 --- /dev/null +++ b/ppo-lora/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf91d7ac2ddda7e1272b902408951545188f843d4da6b19c2e572a6c86a6075b +size 3274 diff --git a/ppo-lora/training_loss.png b/ppo-lora/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..35f0cf6563291f7834e3fd8e87ed1bfbc39a561d Binary files /dev/null and b/ppo-lora/training_loss.png differ diff --git a/ppo-lora/training_reward.png b/ppo-lora/training_reward.png new file mode 100644 index 0000000000000000000000000000000000000000..3a338292915945795287b7f88e54e959dd6af366 Binary files /dev/null and b/ppo-lora/training_reward.png differ diff --git a/ppo-lora/value_head.bin b/ppo-lora/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c4b6b6ef79f1a12b355dffd15a36230f20ea20a --- /dev/null +++ b/ppo-lora/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c700d9b9107a021388083afe3ae14636cd89a51c49e8a848a763f9e73d12c5 +size 21491 diff --git a/rm-lora/README.md b/rm-lora/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/rm-lora/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/rm-lora/adapter_config.json b/rm-lora/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/rm-lora/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/rm-lora/adapter_model.bin b/rm-lora/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..7cca15b6fb657cf1885da1a52d6b99730215281a --- /dev/null +++ b/rm-lora/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e888a52313595cd14955b529744065dcdeed37dc6bbc48f39bc754c9cead9e56 +size 26269517 diff --git a/rm-lora/all_results.json b/rm-lora/all_results.json new file mode 100644 index 0000000000000000000000000000000000000000..1924164376d19dea349e0ccfe367ad7155d717fd --- /dev/null +++ b/rm-lora/all_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 1.0, + "train_loss": 0.21165546916281192, + "train_runtime": 6592.6141, + "train_samples_per_second": 5.528, + "train_steps_per_second": 0.086 +} \ No newline at end of file diff --git a/rm-lora/finetuning_args.json b/rm-lora/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/rm-lora/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/rm-lora/train_results.json b/rm-lora/train_results.json new file mode 100644 index 0000000000000000000000000000000000000000..1924164376d19dea349e0ccfe367ad7155d717fd --- /dev/null +++ b/rm-lora/train_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 1.0, + "train_loss": 0.21165546916281192, + "train_runtime": 6592.6141, + "train_samples_per_second": 5.528, + "train_steps_per_second": 0.086 +} \ No newline at end of file diff --git a/rm-lora/trainer_log.jsonl b/rm-lora/trainer_log.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a2b33778dba01c7ff8adb69b133329d9b2acb1ec --- /dev/null +++ b/rm-lora/trainer_log.jsonl @@ -0,0 +1,224 @@ +{"current_steps": 10, "total_steps": 569, "loss": 0.6949, "reward": null, "learning_rate": 9.997256670306478e-06, "epoch": 0.02, "percentage": 1.76, "elapsed_time": "0:02:05", "remaining_time": "1:56:58"} +{"current_steps": 10, "total_steps": 569, "loss": 0.6949, "reward": null, "learning_rate": 9.997256670306478e-06, "epoch": 0.02, "percentage": 1.76, "elapsed_time": "0:02:05", "remaining_time": "1:56:59"} +{"current_steps": 10, "total_steps": 569, "loss": 0.6949, "reward": null, "learning_rate": 9.997256670306478e-06, "epoch": 0.02, "percentage": 1.76, "elapsed_time": "0:02:05", "remaining_time": "1:56:58"} +{"current_steps": 10, "total_steps": 569, "loss": 0.6949, "reward": null, "learning_rate": 9.997256670306478e-06, "epoch": 0.02, "percentage": 1.76, "elapsed_time": "0:02:05", "remaining_time": "1:56:58"} +{"current_steps": 20, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.980502778148438e-06, "epoch": 0.04, "percentage": 3.51, "elapsed_time": "0:03:57", "remaining_time": "1:48:50"} +{"current_steps": 20, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.980502778148438e-06, "epoch": 0.04, "percentage": 3.51, "elapsed_time": "0:03:57", "remaining_time": "1:48:50"} +{"current_steps": 20, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.980502778148438e-06, "epoch": 0.04, "percentage": 3.51, "elapsed_time": "0:03:57", "remaining_time": "1:48:50"} +{"current_steps": 20, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.980502778148438e-06, "epoch": 0.04, "percentage": 3.51, "elapsed_time": "0:03:57", "remaining_time": "1:48:50"} +{"current_steps": 30, "total_steps": 569, "loss": 0.6942, "reward": null, "learning_rate": 9.948570063910216e-06, "epoch": 0.05, "percentage": 5.27, "elapsed_time": "0:05:54", "remaining_time": "1:46:00"} +{"current_steps": 30, "total_steps": 569, "loss": 0.6942, "reward": null, "learning_rate": 9.948570063910216e-06, "epoch": 0.05, "percentage": 5.27, "elapsed_time": "0:05:54", "remaining_time": "1:46:00"} +{"current_steps": 30, "total_steps": 569, "loss": 0.6942, "reward": null, "learning_rate": 9.948570063910216e-06, "epoch": 0.05, "percentage": 5.27, "elapsed_time": "0:05:54", "remaining_time": "1:46:00"} +{"current_steps": 30, "total_steps": 569, "loss": 0.6942, "reward": null, "learning_rate": 9.948570063910216e-06, "epoch": 0.05, "percentage": 5.27, "elapsed_time": "0:05:54", "remaining_time": "1:46:00"} +{"current_steps": 40, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.901555847282123e-06, "epoch": 0.07, "percentage": 7.03, "elapsed_time": "0:07:53", "remaining_time": "1:44:22"} +{"current_steps": 40, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.901555847282123e-06, "epoch": 0.07, "percentage": 7.03, "elapsed_time": "0:07:53", "remaining_time": "1:44:22"} +{"current_steps": 40, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.901555847282123e-06, "epoch": 0.07, "percentage": 7.03, "elapsed_time": "0:07:53", "remaining_time": "1:44:22"} +{"current_steps": 40, "total_steps": 569, "loss": 0.6937, "reward": null, "learning_rate": 9.901555847282123e-06, "epoch": 0.07, "percentage": 7.03, "elapsed_time": "0:07:53", "remaining_time": "1:44:22"} +{"current_steps": 50, "total_steps": 569, "loss": 0.675, "reward": null, "learning_rate": 9.839603411073388e-06, "epoch": 0.09, "percentage": 8.79, "elapsed_time": "0:09:47", "remaining_time": "1:41:39"} +{"current_steps": 50, "total_steps": 569, "loss": 0.675, "reward": null, "learning_rate": 9.839603411073388e-06, "epoch": 0.09, "percentage": 8.79, "elapsed_time": "0:09:47", "remaining_time": "1:41:39"} +{"current_steps": 50, "total_steps": 569, "loss": 0.675, "reward": null, "learning_rate": 9.839603411073388e-06, "epoch": 0.09, "percentage": 8.79, "elapsed_time": "0:09:47", "remaining_time": "1:41:39"} +{"current_steps": 50, "total_steps": 569, "loss": 0.675, "reward": null, "learning_rate": 9.839603411073388e-06, "epoch": 0.09, "percentage": 8.79, "elapsed_time": "0:09:47", "remaining_time": "1:41:39"} +{"current_steps": 60, "total_steps": 569, "loss": 0.657, "reward": null, "learning_rate": 9.762901564536523e-06, "epoch": 0.11, "percentage": 10.54, "elapsed_time": "0:11:45", "remaining_time": "1:39:45"} +{"current_steps": 60, "total_steps": 569, "loss": 0.657, "reward": null, "learning_rate": 9.762901564536523e-06, "epoch": 0.11, "percentage": 10.54, "elapsed_time": "0:11:45", "remaining_time": "1:39:45"} +{"current_steps": 60, "total_steps": 569, "loss": 0.657, "reward": null, "learning_rate": 9.762901564536523e-06, "epoch": 0.11, "percentage": 10.54, "elapsed_time": "0:11:45", "remaining_time": "1:39:45"} +{"current_steps": 60, "total_steps": 569, "loss": 0.657, "reward": null, "learning_rate": 9.762901564536523e-06, "epoch": 0.11, "percentage": 10.54, "elapsed_time": "0:11:45", "remaining_time": "1:39:45"} +{"current_steps": 70, "total_steps": 569, "loss": 0.6437, "reward": null, "learning_rate": 9.671684067943056e-06, "epoch": 0.12, "percentage": 12.3, "elapsed_time": "0:13:39", "remaining_time": "1:37:21"} +{"current_steps": 70, "total_steps": 569, "loss": 0.6437, "reward": null, "learning_rate": 9.671684067943056e-06, "epoch": 0.12, "percentage": 12.3, "elapsed_time": "0:13:39", "remaining_time": "1:37:21"} +{"current_steps": 70, "total_steps": 569, "loss": 0.6437, "reward": null, "learning_rate": 9.671684067943056e-06, "epoch": 0.12, "percentage": 12.3, "elapsed_time": "0:13:39", "remaining_time": "1:37:21"} +{"current_steps": 70, "total_steps": 569, "loss": 0.6437, "reward": null, "learning_rate": 9.671684067943056e-06, "epoch": 0.12, "percentage": 12.3, "elapsed_time": "0:13:39", "remaining_time": "1:37:21"} +{"current_steps": 80, "total_steps": 569, "loss": 0.6067, "reward": null, "learning_rate": 9.566228920164405e-06, "epoch": 0.14, "percentage": 14.06, "elapsed_time": "0:15:36", "remaining_time": "1:35:23"} +{"current_steps": 80, "total_steps": 569, "loss": 0.6067, "reward": null, "learning_rate": 9.566228920164405e-06, "epoch": 0.14, "percentage": 14.06, "elapsed_time": "0:15:36", "remaining_time": "1:35:23"} +{"current_steps": 80, "total_steps": 569, "loss": 0.6067, "reward": null, "learning_rate": 9.566228920164405e-06, "epoch": 0.14, "percentage": 14.06, "elapsed_time": "0:15:36", "remaining_time": "1:35:23"} +{"current_steps": 80, "total_steps": 569, "loss": 0.6067, "reward": null, "learning_rate": 9.566228920164405e-06, "epoch": 0.14, "percentage": 14.06, "elapsed_time": "0:15:36", "remaining_time": "1:35:23"} +{"current_steps": 90, "total_steps": 569, "loss": 0.5389, "reward": null, "learning_rate": 9.446857511429e-06, "epoch": 0.16, "percentage": 15.82, "elapsed_time": "0:17:33", "remaining_time": "1:33:26"} +{"current_steps": 90, "total_steps": 569, "loss": 0.5389, "reward": null, "learning_rate": 9.446857511429e-06, "epoch": 0.16, "percentage": 15.82, "elapsed_time": "0:17:33", "remaining_time": "1:33:26"} +{"current_steps": 90, "total_steps": 569, "loss": 0.5389, "reward": null, "learning_rate": 9.446857511429e-06, "epoch": 0.16, "percentage": 15.82, "elapsed_time": "0:17:33", "remaining_time": "1:33:26"} +{"current_steps": 90, "total_steps": 569, "loss": 0.5389, "reward": null, "learning_rate": 9.446857511429e-06, "epoch": 0.16, "percentage": 15.82, "elapsed_time": "0:17:33", "remaining_time": "1:33:26"} +{"current_steps": 100, "total_steps": 569, "loss": 0.3593, "reward": null, "learning_rate": 9.313933643837825e-06, "epoch": 0.18, "percentage": 17.57, "elapsed_time": "0:19:33", "remaining_time": "1:31:46"} +{"current_steps": 100, "total_steps": 569, "loss": 0.3593, "reward": null, "learning_rate": 9.313933643837825e-06, "epoch": 0.18, "percentage": 17.57, "elapsed_time": "0:19:33", "remaining_time": "1:31:46"} +{"current_steps": 100, "total_steps": 569, "loss": 0.3593, "reward": null, "learning_rate": 9.313933643837825e-06, "epoch": 0.18, "percentage": 17.57, "elapsed_time": "0:19:33", "remaining_time": "1:31:46"} +{"current_steps": 100, "total_steps": 569, "loss": 0.3593, "reward": null, "learning_rate": 9.313933643837825e-06, "epoch": 0.18, "percentage": 17.57, "elapsed_time": "0:19:33", "remaining_time": "1:31:46"} +{"current_steps": 110, "total_steps": 569, "loss": 0.1982, "reward": null, "learning_rate": 9.167862422623474e-06, "epoch": 0.19, "percentage": 19.33, "elapsed_time": "0:21:31", "remaining_time": "1:29:50"} +{"current_steps": 110, "total_steps": 569, "loss": 0.1982, "reward": null, "learning_rate": 9.167862422623474e-06, "epoch": 0.19, "percentage": 19.33, "elapsed_time": "0:21:31", "remaining_time": "1:29:50"} +{"current_steps": 110, "total_steps": 569, "loss": 0.1982, "reward": null, "learning_rate": 9.167862422623474e-06, "epoch": 0.19, "percentage": 19.33, "elapsed_time": "0:21:31", "remaining_time": "1:29:50"} +{"current_steps": 110, "total_steps": 569, "loss": 0.1982, "reward": null, "learning_rate": 9.167862422623474e-06, "epoch": 0.19, "percentage": 19.33, "elapsed_time": "0:21:31", "remaining_time": "1:29:50"} +{"current_steps": 120, "total_steps": 569, "loss": 0.1791, "reward": null, "learning_rate": 9.009089021531777e-06, "epoch": 0.21, "percentage": 21.09, "elapsed_time": "0:23:33", "remaining_time": "1:28:07"} +{"current_steps": 120, "total_steps": 569, "loss": 0.1791, "reward": null, "learning_rate": 9.009089021531777e-06, "epoch": 0.21, "percentage": 21.09, "elapsed_time": "0:23:33", "remaining_time": "1:28:07"} +{"current_steps": 120, "total_steps": 569, "loss": 0.1791, "reward": null, "learning_rate": 9.009089021531777e-06, "epoch": 0.21, "percentage": 21.09, "elapsed_time": "0:23:33", "remaining_time": "1:28:07"} +{"current_steps": 120, "total_steps": 569, "loss": 0.1791, "reward": null, "learning_rate": 9.009089021531777e-06, "epoch": 0.21, "percentage": 21.09, "elapsed_time": "0:23:33", "remaining_time": "1:28:07"} +{"current_steps": 130, "total_steps": 569, "loss": 0.1522, "reward": null, "learning_rate": 8.838097326088667e-06, "epoch": 0.23, "percentage": 22.85, "elapsed_time": "0:25:29", "remaining_time": "1:26:06"} +{"current_steps": 130, "total_steps": 569, "loss": 0.1522, "reward": null, "learning_rate": 8.838097326088667e-06, "epoch": 0.23, "percentage": 22.85, "elapsed_time": "0:25:29", "remaining_time": "1:26:06"} +{"current_steps": 130, "total_steps": 569, "loss": 0.1522, "reward": null, "learning_rate": 8.838097326088667e-06, "epoch": 0.23, "percentage": 22.85, "elapsed_time": "0:25:29", "remaining_time": "1:26:06"} +{"current_steps": 130, "total_steps": 569, "loss": 0.1522, "reward": null, "learning_rate": 8.838097326088667e-06, "epoch": 0.23, "percentage": 22.85, "elapsed_time": "0:25:29", "remaining_time": "1:26:06"} +{"current_steps": 140, "total_steps": 569, "loss": 0.1841, "reward": null, "learning_rate": 8.65540845888717e-06, "epoch": 0.25, "percentage": 24.6, "elapsed_time": "0:27:24", "remaining_time": "1:24:00"} +{"current_steps": 140, "total_steps": 569, "loss": 0.1841, "reward": null, "learning_rate": 8.65540845888717e-06, "epoch": 0.25, "percentage": 24.6, "elapsed_time": "0:27:24", "remaining_time": "1:24:00"} +{"current_steps": 140, "total_steps": 569, "loss": 0.1841, "reward": null, "learning_rate": 8.65540845888717e-06, "epoch": 0.25, "percentage": 24.6, "elapsed_time": "0:27:24", "remaining_time": "1:24:00"} +{"current_steps": 140, "total_steps": 569, "loss": 0.1841, "reward": null, "learning_rate": 8.65540845888717e-06, "epoch": 0.25, "percentage": 24.6, "elapsed_time": "0:27:24", "remaining_time": "1:24:00"} +{"current_steps": 150, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 8.46157919138889e-06, "epoch": 0.26, "percentage": 26.36, "elapsed_time": "0:29:21", "remaining_time": "1:21:59"} +{"current_steps": 150, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 8.46157919138889e-06, "epoch": 0.26, "percentage": 26.36, "elapsed_time": "0:29:21", "remaining_time": "1:21:59"} +{"current_steps": 150, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 8.46157919138889e-06, "epoch": 0.26, "percentage": 26.36, "elapsed_time": "0:29:21", "remaining_time": "1:21:59"} +{"current_steps": 150, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 8.46157919138889e-06, "epoch": 0.26, "percentage": 26.36, "elapsed_time": "0:29:21", "remaining_time": "1:21:59"} +{"current_steps": 160, "total_steps": 569, "loss": 0.1695, "reward": null, "learning_rate": 8.257200247080249e-06, "epoch": 0.28, "percentage": 28.12, "elapsed_time": "0:31:15", "remaining_time": "1:19:55"} +{"current_steps": 160, "total_steps": 569, "loss": 0.1695, "reward": null, "learning_rate": 8.257200247080249e-06, "epoch": 0.28, "percentage": 28.12, "elapsed_time": "0:31:15", "remaining_time": "1:19:55"} +{"current_steps": 160, "total_steps": 569, "loss": 0.1695, "reward": null, "learning_rate": 8.257200247080249e-06, "epoch": 0.28, "percentage": 28.12, "elapsed_time": "0:31:15", "remaining_time": "1:19:55"} +{"current_steps": 160, "total_steps": 569, "loss": 0.1695, "reward": null, "learning_rate": 8.257200247080249e-06, "epoch": 0.28, "percentage": 28.12, "elapsed_time": "0:31:15", "remaining_time": "1:19:55"} +{"current_steps": 170, "total_steps": 569, "loss": 0.1536, "reward": null, "learning_rate": 8.042894501154937e-06, "epoch": 0.3, "percentage": 29.88, "elapsed_time": "0:33:12", "remaining_time": "1:17:55"} +{"current_steps": 170, "total_steps": 569, "loss": 0.1536, "reward": null, "learning_rate": 8.042894501154937e-06, "epoch": 0.3, "percentage": 29.88, "elapsed_time": "0:33:12", "remaining_time": "1:17:55"} +{"current_steps": 170, "total_steps": 569, "loss": 0.1536, "reward": null, "learning_rate": 8.042894501154937e-06, "epoch": 0.3, "percentage": 29.88, "elapsed_time": "0:33:12", "remaining_time": "1:17:55"} +{"current_steps": 170, "total_steps": 569, "loss": 0.1536, "reward": null, "learning_rate": 8.042894501154937e-06, "epoch": 0.3, "percentage": 29.88, "elapsed_time": "0:33:12", "remaining_time": "1:17:55"} +{"current_steps": 180, "total_steps": 569, "loss": 0.1233, "reward": null, "learning_rate": 7.819315082209217e-06, "epoch": 0.32, "percentage": 31.63, "elapsed_time": "0:35:08", "remaining_time": "1:15:57"} +{"current_steps": 180, "total_steps": 569, "loss": 0.1233, "reward": null, "learning_rate": 7.819315082209217e-06, "epoch": 0.32, "percentage": 31.63, "elapsed_time": "0:35:08", "remaining_time": "1:15:57"} +{"current_steps": 180, "total_steps": 569, "loss": 0.1233, "reward": null, "learning_rate": 7.819315082209217e-06, "epoch": 0.32, "percentage": 31.63, "elapsed_time": "0:35:08", "remaining_time": "1:15:57"} +{"current_steps": 180, "total_steps": 569, "loss": 0.1233, "reward": null, "learning_rate": 7.819315082209217e-06, "epoch": 0.32, "percentage": 31.63, "elapsed_time": "0:35:08", "remaining_time": "1:15:57"} +{"current_steps": 190, "total_steps": 569, "loss": 0.1254, "reward": null, "learning_rate": 7.587143381735498e-06, "epoch": 0.33, "percentage": 33.39, "elapsed_time": "0:37:04", "remaining_time": "1:13:56"} +{"current_steps": 190, "total_steps": 569, "loss": 0.1254, "reward": null, "learning_rate": 7.587143381735498e-06, "epoch": 0.33, "percentage": 33.39, "elapsed_time": "0:37:04", "remaining_time": "1:13:56"} +{"current_steps": 190, "total_steps": 569, "loss": 0.1254, "reward": null, "learning_rate": 7.587143381735498e-06, "epoch": 0.33, "percentage": 33.39, "elapsed_time": "0:37:04", "remaining_time": "1:13:56"} +{"current_steps": 190, "total_steps": 569, "loss": 0.1254, "reward": null, "learning_rate": 7.587143381735498e-06, "epoch": 0.33, "percentage": 33.39, "elapsed_time": "0:37:04", "remaining_time": "1:13:56"} +{"current_steps": 200, "total_steps": 569, "loss": 0.1153, "reward": null, "learning_rate": 7.347086977480552e-06, "epoch": 0.35, "percentage": 35.15, "elapsed_time": "0:39:05", "remaining_time": "1:12:06"} +{"current_steps": 200, "total_steps": 569, "loss": 0.1153, "reward": null, "learning_rate": 7.347086977480552e-06, "epoch": 0.35, "percentage": 35.15, "elapsed_time": "0:39:05", "remaining_time": "1:12:06"} +{"current_steps": 200, "total_steps": 569, "loss": 0.1153, "reward": null, "learning_rate": 7.347086977480552e-06, "epoch": 0.35, "percentage": 35.15, "elapsed_time": "0:39:05", "remaining_time": "1:12:06"} +{"current_steps": 200, "total_steps": 569, "loss": 0.1153, "reward": null, "learning_rate": 7.347086977480552e-06, "epoch": 0.35, "percentage": 35.15, "elapsed_time": "0:39:05", "remaining_time": "1:12:06"} +{"current_steps": 210, "total_steps": 569, "loss": 0.1524, "reward": null, "learning_rate": 7.09987747699721e-06, "epoch": 0.37, "percentage": 36.91, "elapsed_time": "0:41:00", "remaining_time": "1:10:07"} +{"current_steps": 210, "total_steps": 569, "loss": 0.1524, "reward": null, "learning_rate": 7.09987747699721e-06, "epoch": 0.37, "percentage": 36.91, "elapsed_time": "0:41:00", "remaining_time": "1:10:07"} +{"current_steps": 210, "total_steps": 569, "loss": 0.1524, "reward": null, "learning_rate": 7.09987747699721e-06, "epoch": 0.37, "percentage": 36.91, "elapsed_time": "0:41:00", "remaining_time": "1:10:07"} +{"current_steps": 210, "total_steps": 569, "loss": 0.1524, "reward": null, "learning_rate": 7.09987747699721e-06, "epoch": 0.37, "percentage": 36.91, "elapsed_time": "0:41:00", "remaining_time": "1:10:07"} +{"current_steps": 220, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 6.846268287961667e-06, "epoch": 0.39, "percentage": 38.66, "elapsed_time": "0:42:51", "remaining_time": "1:07:59"} +{"current_steps": 220, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 6.846268287961667e-06, "epoch": 0.39, "percentage": 38.66, "elapsed_time": "0:42:51", "remaining_time": "1:07:59"} +{"current_steps": 220, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 6.846268287961667e-06, "epoch": 0.39, "percentage": 38.66, "elapsed_time": "0:42:51", "remaining_time": "1:07:59"} +{"current_steps": 220, "total_steps": 569, "loss": 0.1299, "reward": null, "learning_rate": 6.846268287961667e-06, "epoch": 0.39, "percentage": 38.66, "elapsed_time": "0:42:51", "remaining_time": "1:07:59"} +{"current_steps": 230, "total_steps": 569, "loss": 0.1232, "reward": null, "learning_rate": 6.587032322051667e-06, "epoch": 0.4, "percentage": 40.42, "elapsed_time": "0:44:48", "remaining_time": "1:06:02"} +{"current_steps": 230, "total_steps": 569, "loss": 0.1232, "reward": null, "learning_rate": 6.587032322051667e-06, "epoch": 0.4, "percentage": 40.42, "elapsed_time": "0:44:48", "remaining_time": "1:06:02"} +{"current_steps": 230, "total_steps": 569, "loss": 0.1232, "reward": null, "learning_rate": 6.587032322051667e-06, "epoch": 0.4, "percentage": 40.42, "elapsed_time": "0:44:48", "remaining_time": "1:06:02"} +{"current_steps": 230, "total_steps": 569, "loss": 0.1232, "reward": null, "learning_rate": 6.587032322051667e-06, "epoch": 0.4, "percentage": 40.42, "elapsed_time": "0:44:48", "remaining_time": "1:06:02"} +{"current_steps": 240, "total_steps": 569, "loss": 0.1385, "reward": null, "learning_rate": 6.32295963938335e-06, "epoch": 0.42, "percentage": 42.18, "elapsed_time": "0:46:46", "remaining_time": "1:04:06"} +{"current_steps": 240, "total_steps": 569, "loss": 0.1385, "reward": null, "learning_rate": 6.32295963938335e-06, "epoch": 0.42, "percentage": 42.18, "elapsed_time": "0:46:46", "remaining_time": "1:04:06"} +{"current_steps": 240, "total_steps": 569, "loss": 0.1385, "reward": null, "learning_rate": 6.32295963938335e-06, "epoch": 0.42, "percentage": 42.18, "elapsed_time": "0:46:46", "remaining_time": "1:04:06"} +{"current_steps": 240, "total_steps": 569, "loss": 0.1385, "reward": null, "learning_rate": 6.32295963938335e-06, "epoch": 0.42, "percentage": 42.18, "elapsed_time": "0:46:46", "remaining_time": "1:04:06"} +{"current_steps": 250, "total_steps": 569, "loss": 0.1248, "reward": null, "learning_rate": 6.05485504068568e-06, "epoch": 0.44, "percentage": 43.94, "elapsed_time": "0:48:41", "remaining_time": "1:02:08"} +{"current_steps": 250, "total_steps": 569, "loss": 0.1248, "reward": null, "learning_rate": 6.05485504068568e-06, "epoch": 0.44, "percentage": 43.94, "elapsed_time": "0:48:41", "remaining_time": "1:02:08"} +{"current_steps": 250, "total_steps": 569, "loss": 0.1248, "reward": null, "learning_rate": 6.05485504068568e-06, "epoch": 0.44, "percentage": 43.94, "elapsed_time": "0:48:41", "remaining_time": "1:02:08"} +{"current_steps": 250, "total_steps": 569, "loss": 0.1248, "reward": null, "learning_rate": 6.05485504068568e-06, "epoch": 0.44, "percentage": 43.94, "elapsed_time": "0:48:41", "remaining_time": "1:02:08"} +{"current_steps": 260, "total_steps": 569, "loss": 0.1271, "reward": null, "learning_rate": 5.783535614550666e-06, "epoch": 0.46, "percentage": 45.69, "elapsed_time": "0:50:36", "remaining_time": "1:00:09"} +{"current_steps": 260, "total_steps": 569, "loss": 0.1271, "reward": null, "learning_rate": 5.783535614550666e-06, "epoch": 0.46, "percentage": 45.69, "elapsed_time": "0:50:36", "remaining_time": "1:00:09"} +{"current_steps": 260, "total_steps": 569, "loss": 0.1271, "reward": null, "learning_rate": 5.783535614550666e-06, "epoch": 0.46, "percentage": 45.69, "elapsed_time": "0:50:36", "remaining_time": "1:00:09"} +{"current_steps": 260, "total_steps": 569, "loss": 0.1271, "reward": null, "learning_rate": 5.783535614550666e-06, "epoch": 0.46, "percentage": 45.69, "elapsed_time": "0:50:36", "remaining_time": "1:00:09"} +{"current_steps": 270, "total_steps": 569, "loss": 0.073, "reward": null, "learning_rate": 5.509828247234505e-06, "epoch": 0.47, "percentage": 47.45, "elapsed_time": "0:52:32", "remaining_time": "0:58:11"} +{"current_steps": 270, "total_steps": 569, "loss": 0.073, "reward": null, "learning_rate": 5.509828247234505e-06, "epoch": 0.47, "percentage": 47.45, "elapsed_time": "0:52:32", "remaining_time": "0:58:11"} +{"current_steps": 270, "total_steps": 569, "loss": 0.073, "reward": null, "learning_rate": 5.509828247234505e-06, "epoch": 0.47, "percentage": 47.45, "elapsed_time": "0:52:32", "remaining_time": "0:58:11"} +{"current_steps": 270, "total_steps": 569, "loss": 0.073, "reward": null, "learning_rate": 5.509828247234505e-06, "epoch": 0.47, "percentage": 47.45, "elapsed_time": "0:52:32", "remaining_time": "0:58:11"} +{"current_steps": 280, "total_steps": 569, "loss": 0.1234, "reward": null, "learning_rate": 5.234567102598881e-06, "epoch": 0.49, "percentage": 49.21, "elapsed_time": "0:54:32", "remaining_time": "0:56:17"} +{"current_steps": 280, "total_steps": 569, "loss": 0.1234, "reward": null, "learning_rate": 5.234567102598881e-06, "epoch": 0.49, "percentage": 49.21, "elapsed_time": "0:54:32", "remaining_time": "0:56:17"} +{"current_steps": 280, "total_steps": 569, "loss": 0.1234, "reward": null, "learning_rate": 5.234567102598881e-06, "epoch": 0.49, "percentage": 49.21, "elapsed_time": "0:54:32", "remaining_time": "0:56:17"} +{"current_steps": 280, "total_steps": 569, "loss": 0.1234, "reward": null, "learning_rate": 5.234567102598881e-06, "epoch": 0.49, "percentage": 49.21, "elapsed_time": "0:54:32", "remaining_time": "0:56:17"} +{"current_steps": 290, "total_steps": 569, "loss": 0.1003, "reward": null, "learning_rate": 4.958591079872667e-06, "epoch": 0.51, "percentage": 50.97, "elapsed_time": "0:56:29", "remaining_time": "0:54:21"} +{"current_steps": 290, "total_steps": 569, "loss": 0.1003, "reward": null, "learning_rate": 4.958591079872667e-06, "epoch": 0.51, "percentage": 50.97, "elapsed_time": "0:56:29", "remaining_time": "0:54:21"} +{"current_steps": 290, "total_steps": 569, "loss": 0.1003, "reward": null, "learning_rate": 4.958591079872667e-06, "epoch": 0.51, "percentage": 50.97, "elapsed_time": "0:56:29", "remaining_time": "0:54:21"} +{"current_steps": 290, "total_steps": 569, "loss": 0.1003, "reward": null, "learning_rate": 4.958591079872667e-06, "epoch": 0.51, "percentage": 50.97, "elapsed_time": "0:56:29", "remaining_time": "0:54:21"} +{"current_steps": 300, "total_steps": 569, "loss": 0.1757, "reward": null, "learning_rate": 4.682741256981922e-06, "epoch": 0.53, "percentage": 52.72, "elapsed_time": "0:58:22", "remaining_time": "0:52:20"} +{"current_steps": 300, "total_steps": 569, "loss": 0.1757, "reward": null, "learning_rate": 4.682741256981922e-06, "epoch": 0.53, "percentage": 52.72, "elapsed_time": "0:58:22", "remaining_time": "0:52:20"} +{"current_steps": 300, "total_steps": 569, "loss": 0.1757, "reward": null, "learning_rate": 4.682741256981922e-06, "epoch": 0.53, "percentage": 52.72, "elapsed_time": "0:58:22", "remaining_time": "0:52:20"} +{"current_steps": 300, "total_steps": 569, "loss": 0.1757, "reward": null, "learning_rate": 4.682741256981922e-06, "epoch": 0.53, "percentage": 52.72, "elapsed_time": "0:58:22", "remaining_time": "0:52:20"} +{"current_steps": 310, "total_steps": 569, "loss": 0.1151, "reward": null, "learning_rate": 4.407858327239952e-06, "epoch": 0.54, "percentage": 54.48, "elapsed_time": "1:00:16", "remaining_time": "0:50:21"} +{"current_steps": 310, "total_steps": 569, "loss": 0.1151, "reward": null, "learning_rate": 4.407858327239952e-06, "epoch": 0.54, "percentage": 54.48, "elapsed_time": "1:00:16", "remaining_time": "0:50:21"} +{"current_steps": 310, "total_steps": 569, "loss": 0.1151, "reward": null, "learning_rate": 4.407858327239952e-06, "epoch": 0.54, "percentage": 54.48, "elapsed_time": "1:00:16", "remaining_time": "0:50:21"} +{"current_steps": 310, "total_steps": 569, "loss": 0.1151, "reward": null, "learning_rate": 4.407858327239952e-06, "epoch": 0.54, "percentage": 54.48, "elapsed_time": "1:00:16", "remaining_time": "0:50:21"} +{"current_steps": 320, "total_steps": 569, "loss": 0.1124, "reward": null, "learning_rate": 4.134780037209563e-06, "epoch": 0.56, "percentage": 56.24, "elapsed_time": "1:02:12", "remaining_time": "0:48:24"} +{"current_steps": 320, "total_steps": 569, "loss": 0.1124, "reward": null, "learning_rate": 4.134780037209563e-06, "epoch": 0.56, "percentage": 56.24, "elapsed_time": "1:02:12", "remaining_time": "0:48:24"} +{"current_steps": 320, "total_steps": 569, "loss": 0.1124, "reward": null, "learning_rate": 4.134780037209563e-06, "epoch": 0.56, "percentage": 56.24, "elapsed_time": "1:02:12", "remaining_time": "0:48:24"} +{"current_steps": 320, "total_steps": 569, "loss": 0.1124, "reward": null, "learning_rate": 4.134780037209563e-06, "epoch": 0.56, "percentage": 56.24, "elapsed_time": "1:02:12", "remaining_time": "0:48:24"} +{"current_steps": 330, "total_steps": 569, "loss": 0.0899, "reward": null, "learning_rate": 3.864338633545956e-06, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "1:04:11", "remaining_time": "0:46:29"} +{"current_steps": 330, "total_steps": 569, "loss": 0.0899, "reward": null, "learning_rate": 3.864338633545956e-06, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "1:04:11", "remaining_time": "0:46:29"} +{"current_steps": 330, "total_steps": 569, "loss": 0.0899, "reward": null, "learning_rate": 3.864338633545956e-06, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "1:04:11", "remaining_time": "0:46:29"} +{"current_steps": 330, "total_steps": 569, "loss": 0.0899, "reward": null, "learning_rate": 3.864338633545956e-06, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "1:04:11", "remaining_time": "0:46:29"} +{"current_steps": 340, "total_steps": 569, "loss": 0.1251, "reward": null, "learning_rate": 3.597358326601413e-06, "epoch": 0.6, "percentage": 59.75, "elapsed_time": "1:06:08", "remaining_time": "0:44:33"} +{"current_steps": 340, "total_steps": 569, "loss": 0.1251, "reward": null, "learning_rate": 3.597358326601413e-06, "epoch": 0.6, "percentage": 59.75, "elapsed_time": "1:06:08", "remaining_time": "0:44:33"} +{"current_steps": 340, "total_steps": 569, "loss": 0.1251, "reward": null, "learning_rate": 3.597358326601413e-06, "epoch": 0.6, "percentage": 59.75, "elapsed_time": "1:06:08", "remaining_time": "0:44:33"} +{"current_steps": 340, "total_steps": 569, "loss": 0.1251, "reward": null, "learning_rate": 3.597358326601413e-06, "epoch": 0.6, "percentage": 59.75, "elapsed_time": "1:06:08", "remaining_time": "0:44:33"} +{"current_steps": 350, "total_steps": 569, "loss": 0.171, "reward": null, "learning_rate": 3.334652778521813e-06, "epoch": 0.61, "percentage": 61.51, "elapsed_time": "1:08:02", "remaining_time": "0:42:34"} +{"current_steps": 350, "total_steps": 569, "loss": 0.171, "reward": null, "learning_rate": 3.334652778521813e-06, "epoch": 0.61, "percentage": 61.51, "elapsed_time": "1:08:02", "remaining_time": "0:42:34"} +{"current_steps": 350, "total_steps": 569, "loss": 0.171, "reward": null, "learning_rate": 3.334652778521813e-06, "epoch": 0.61, "percentage": 61.51, "elapsed_time": "1:08:02", "remaining_time": "0:42:34"} +{"current_steps": 350, "total_steps": 569, "loss": 0.171, "reward": null, "learning_rate": 3.334652778521813e-06, "epoch": 0.61, "percentage": 61.51, "elapsed_time": "1:08:02", "remaining_time": "0:42:34"} +{"current_steps": 360, "total_steps": 569, "loss": 0.1447, "reward": null, "learning_rate": 3.077022623490371e-06, "epoch": 0.63, "percentage": 63.27, "elapsed_time": "1:09:56", "remaining_time": "0:40:36"} +{"current_steps": 360, "total_steps": 569, "loss": 0.1447, "reward": null, "learning_rate": 3.077022623490371e-06, "epoch": 0.63, "percentage": 63.27, "elapsed_time": "1:09:56", "remaining_time": "0:40:36"} +{"current_steps": 360, "total_steps": 569, "loss": 0.1447, "reward": null, "learning_rate": 3.077022623490371e-06, "epoch": 0.63, "percentage": 63.27, "elapsed_time": "1:09:56", "remaining_time": "0:40:36"} +{"current_steps": 360, "total_steps": 569, "loss": 0.1447, "reward": null, "learning_rate": 3.077022623490371e-06, "epoch": 0.63, "percentage": 63.27, "elapsed_time": "1:09:56", "remaining_time": "0:40:36"} +{"current_steps": 370, "total_steps": 569, "loss": 0.1192, "reward": null, "learning_rate": 2.825253027676026e-06, "epoch": 0.65, "percentage": 65.03, "elapsed_time": "1:11:52", "remaining_time": "0:38:39"} +{"current_steps": 370, "total_steps": 569, "loss": 0.1192, "reward": null, "learning_rate": 2.825253027676026e-06, "epoch": 0.65, "percentage": 65.03, "elapsed_time": "1:11:52", "remaining_time": "0:38:39"} +{"current_steps": 370, "total_steps": 569, "loss": 0.1192, "reward": null, "learning_rate": 2.825253027676026e-06, "epoch": 0.65, "percentage": 65.03, "elapsed_time": "1:11:52", "remaining_time": "0:38:39"} +{"current_steps": 370, "total_steps": 569, "loss": 0.1192, "reward": null, "learning_rate": 2.825253027676026e-06, "epoch": 0.65, "percentage": 65.03, "elapsed_time": "1:11:52", "remaining_time": "0:38:39"} +{"current_steps": 380, "total_steps": 569, "loss": 0.1158, "reward": null, "learning_rate": 2.580111296322904e-06, "epoch": 0.67, "percentage": 66.78, "elapsed_time": "1:13:46", "remaining_time": "0:36:41"} +{"current_steps": 380, "total_steps": 569, "loss": 0.1158, "reward": null, "learning_rate": 2.580111296322904e-06, "epoch": 0.67, "percentage": 66.78, "elapsed_time": "1:13:46", "remaining_time": "0:36:41"} +{"current_steps": 380, "total_steps": 569, "loss": 0.1158, "reward": null, "learning_rate": 2.580111296322904e-06, "epoch": 0.67, "percentage": 66.78, "elapsed_time": "1:13:46", "remaining_time": "0:36:41"} +{"current_steps": 380, "total_steps": 569, "loss": 0.1158, "reward": null, "learning_rate": 2.580111296322904e-06, "epoch": 0.67, "percentage": 66.78, "elapsed_time": "1:13:46", "remaining_time": "0:36:41"} +{"current_steps": 390, "total_steps": 569, "loss": 0.1028, "reward": null, "learning_rate": 2.342344535273608e-06, "epoch": 0.68, "percentage": 68.54, "elapsed_time": "1:15:39", "remaining_time": "0:34:43"} +{"current_steps": 390, "total_steps": 569, "loss": 0.1028, "reward": null, "learning_rate": 2.342344535273608e-06, "epoch": 0.68, "percentage": 68.54, "elapsed_time": "1:15:39", "remaining_time": "0:34:43"} +{"current_steps": 390, "total_steps": 569, "loss": 0.1028, "reward": null, "learning_rate": 2.342344535273608e-06, "epoch": 0.68, "percentage": 68.54, "elapsed_time": "1:15:39", "remaining_time": "0:34:43"} +{"current_steps": 390, "total_steps": 569, "loss": 0.1028, "reward": null, "learning_rate": 2.342344535273608e-06, "epoch": 0.68, "percentage": 68.54, "elapsed_time": "1:15:39", "remaining_time": "0:34:43"} +{"current_steps": 400, "total_steps": 569, "loss": 0.1171, "reward": null, "learning_rate": 2.112677374053164e-06, "epoch": 0.7, "percentage": 70.3, "elapsed_time": "1:17:37", "remaining_time": "0:32:47"} +{"current_steps": 400, "total_steps": 569, "loss": 0.1171, "reward": null, "learning_rate": 2.112677374053164e-06, "epoch": 0.7, "percentage": 70.3, "elapsed_time": "1:17:37", "remaining_time": "0:32:47"} +{"current_steps": 400, "total_steps": 569, "loss": 0.1171, "reward": null, "learning_rate": 2.112677374053164e-06, "epoch": 0.7, "percentage": 70.3, "elapsed_time": "1:17:37", "remaining_time": "0:32:47"} +{"current_steps": 400, "total_steps": 569, "loss": 0.1171, "reward": null, "learning_rate": 2.112677374053164e-06, "epoch": 0.7, "percentage": 70.3, "elapsed_time": "1:17:37", "remaining_time": "0:32:47"} +{"current_steps": 410, "total_steps": 569, "loss": 0.1017, "reward": null, "learning_rate": 1.8918097574529193e-06, "epoch": 0.72, "percentage": 72.06, "elapsed_time": "1:19:31", "remaining_time": "0:30:50"} +{"current_steps": 410, "total_steps": 569, "loss": 0.1017, "reward": null, "learning_rate": 1.8918097574529193e-06, "epoch": 0.72, "percentage": 72.06, "elapsed_time": "1:19:31", "remaining_time": "0:30:50"} +{"current_steps": 410, "total_steps": 569, "loss": 0.1017, "reward": null, "learning_rate": 1.8918097574529193e-06, "epoch": 0.72, "percentage": 72.06, "elapsed_time": "1:19:31", "remaining_time": "0:30:50"} +{"current_steps": 410, "total_steps": 569, "loss": 0.1017, "reward": null, "learning_rate": 1.8918097574529193e-06, "epoch": 0.72, "percentage": 72.06, "elapsed_time": "1:19:31", "remaining_time": "0:30:50"} +{"current_steps": 420, "total_steps": 569, "loss": 0.0763, "reward": null, "learning_rate": 1.68041481234479e-06, "epoch": 0.74, "percentage": 73.81, "elapsed_time": "1:21:28", "remaining_time": "0:28:54"} +{"current_steps": 420, "total_steps": 569, "loss": 0.0763, "reward": null, "learning_rate": 1.68041481234479e-06, "epoch": 0.74, "percentage": 73.81, "elapsed_time": "1:21:28", "remaining_time": "0:28:54"} +{"current_steps": 420, "total_steps": 569, "loss": 0.0763, "reward": null, "learning_rate": 1.68041481234479e-06, "epoch": 0.74, "percentage": 73.81, "elapsed_time": "1:21:28", "remaining_time": "0:28:54"} +{"current_steps": 420, "total_steps": 569, "loss": 0.0763, "reward": null, "learning_rate": 1.68041481234479e-06, "epoch": 0.74, "percentage": 73.81, "elapsed_time": "1:21:28", "remaining_time": "0:28:54"} +{"current_steps": 430, "total_steps": 569, "loss": 0.1185, "reward": null, "learning_rate": 1.4791367962271425e-06, "epoch": 0.76, "percentage": 75.57, "elapsed_time": "1:23:23", "remaining_time": "0:26:57"} +{"current_steps": 430, "total_steps": 569, "loss": 0.1185, "reward": null, "learning_rate": 1.4791367962271425e-06, "epoch": 0.76, "percentage": 75.57, "elapsed_time": "1:23:23", "remaining_time": "0:26:57"} +{"current_steps": 430, "total_steps": 569, "loss": 0.1185, "reward": null, "learning_rate": 1.4791367962271425e-06, "epoch": 0.76, "percentage": 75.57, "elapsed_time": "1:23:23", "remaining_time": "0:26:57"} +{"current_steps": 430, "total_steps": 569, "loss": 0.1185, "reward": null, "learning_rate": 1.4791367962271425e-06, "epoch": 0.76, "percentage": 75.57, "elapsed_time": "1:23:23", "remaining_time": "0:26:57"} +{"current_steps": 440, "total_steps": 569, "loss": 0.0701, "reward": null, "learning_rate": 1.2885891337543539e-06, "epoch": 0.77, "percentage": 77.33, "elapsed_time": "1:25:17", "remaining_time": "0:25:00"} +{"current_steps": 440, "total_steps": 569, "loss": 0.0701, "reward": null, "learning_rate": 1.2885891337543539e-06, "epoch": 0.77, "percentage": 77.33, "elapsed_time": "1:25:17", "remaining_time": "0:25:00"} +{"current_steps": 440, "total_steps": 569, "loss": 0.0701, "reward": null, "learning_rate": 1.2885891337543539e-06, "epoch": 0.77, "percentage": 77.33, "elapsed_time": "1:25:17", "remaining_time": "0:25:00"} +{"current_steps": 440, "total_steps": 569, "loss": 0.0701, "reward": null, "learning_rate": 1.2885891337543539e-06, "epoch": 0.77, "percentage": 77.33, "elapsed_time": "1:25:17", "remaining_time": "0:25:00"} +{"current_steps": 450, "total_steps": 569, "loss": 0.0873, "reward": null, "learning_rate": 1.1093525472340471e-06, "epoch": 0.79, "percentage": 79.09, "elapsed_time": "1:27:16", "remaining_time": "0:23:04"} +{"current_steps": 450, "total_steps": 569, "loss": 0.0873, "reward": null, "learning_rate": 1.1093525472340471e-06, "epoch": 0.79, "percentage": 79.09, "elapsed_time": "1:27:16", "remaining_time": "0:23:04"} +{"current_steps": 450, "total_steps": 569, "loss": 0.0873, "reward": null, "learning_rate": 1.1093525472340471e-06, "epoch": 0.79, "percentage": 79.09, "elapsed_time": "1:27:16", "remaining_time": "0:23:04"} +{"current_steps": 450, "total_steps": 569, "loss": 0.0873, "reward": null, "learning_rate": 1.1093525472340471e-06, "epoch": 0.79, "percentage": 79.09, "elapsed_time": "1:27:16", "remaining_time": "0:23:04"} +{"current_steps": 460, "total_steps": 569, "loss": 0.127, "reward": null, "learning_rate": 9.419732867896048e-07, "epoch": 0.81, "percentage": 80.84, "elapsed_time": "1:29:09", "remaining_time": "0:21:07"} +{"current_steps": 460, "total_steps": 569, "loss": 0.127, "reward": null, "learning_rate": 9.419732867896048e-07, "epoch": 0.81, "percentage": 80.84, "elapsed_time": "1:29:09", "remaining_time": "0:21:07"} +{"current_steps": 460, "total_steps": 569, "loss": 0.127, "reward": null, "learning_rate": 9.419732867896048e-07, "epoch": 0.81, "percentage": 80.84, "elapsed_time": "1:29:09", "remaining_time": "0:21:07"} +{"current_steps": 460, "total_steps": 569, "loss": 0.127, "reward": null, "learning_rate": 9.419732867896048e-07, "epoch": 0.81, "percentage": 80.84, "elapsed_time": "1:29:09", "remaining_time": "0:21:07"} +{"current_steps": 470, "total_steps": 569, "loss": 0.1289, "reward": null, "learning_rate": 7.869614655817576e-07, "epoch": 0.83, "percentage": 82.6, "elapsed_time": "1:31:05", "remaining_time": "0:19:11"} +{"current_steps": 470, "total_steps": 569, "loss": 0.1289, "reward": null, "learning_rate": 7.869614655817576e-07, "epoch": 0.83, "percentage": 82.6, "elapsed_time": "1:31:05", "remaining_time": "0:19:11"} +{"current_steps": 470, "total_steps": 569, "loss": 0.1289, "reward": null, "learning_rate": 7.869614655817576e-07, "epoch": 0.83, "percentage": 82.6, "elapsed_time": "1:31:05", "remaining_time": "0:19:11"} +{"current_steps": 470, "total_steps": 569, "loss": 0.1289, "reward": null, "learning_rate": 7.869614655817576e-07, "epoch": 0.83, "percentage": 82.6, "elapsed_time": "1:31:05", "remaining_time": "0:19:11"} +{"current_steps": 480, "total_steps": 569, "loss": 0.1211, "reward": null, "learning_rate": 6.44789505162955e-07, "epoch": 0.84, "percentage": 84.36, "elapsed_time": "1:32:56", "remaining_time": "0:17:13"} +{"current_steps": 480, "total_steps": 569, "loss": 0.1211, "reward": null, "learning_rate": 6.44789505162955e-07, "epoch": 0.84, "percentage": 84.36, "elapsed_time": "1:32:56", "remaining_time": "0:17:13"} +{"current_steps": 480, "total_steps": 569, "loss": 0.1211, "reward": null, "learning_rate": 6.44789505162955e-07, "epoch": 0.84, "percentage": 84.36, "elapsed_time": "1:32:56", "remaining_time": "0:17:13"} +{"current_steps": 480, "total_steps": 569, "loss": 0.1211, "reward": null, "learning_rate": 6.44789505162955e-07, "epoch": 0.84, "percentage": 84.36, "elapsed_time": "1:32:56", "remaining_time": "0:17:13"} +{"current_steps": 490, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 5.158906957025079e-07, "epoch": 0.86, "percentage": 86.12, "elapsed_time": "1:34:54", "remaining_time": "0:15:18"} +{"current_steps": 490, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 5.158906957025079e-07, "epoch": 0.86, "percentage": 86.12, "elapsed_time": "1:34:54", "remaining_time": "0:15:18"} +{"current_steps": 490, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 5.158906957025079e-07, "epoch": 0.86, "percentage": 86.12, "elapsed_time": "1:34:54", "remaining_time": "0:15:18"} +{"current_steps": 490, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 5.158906957025079e-07, "epoch": 0.86, "percentage": 86.12, "elapsed_time": "1:34:54", "remaining_time": "0:15:18"} +{"current_steps": 500, "total_steps": 569, "loss": 0.09, "reward": null, "learning_rate": 4.0065787547042543e-07, "epoch": 0.88, "percentage": 87.87, "elapsed_time": "1:36:49", "remaining_time": "0:13:21"} +{"current_steps": 500, "total_steps": 569, "loss": 0.09, "reward": null, "learning_rate": 4.0065787547042543e-07, "epoch": 0.88, "percentage": 87.87, "elapsed_time": "1:36:49", "remaining_time": "0:13:21"} +{"current_steps": 500, "total_steps": 569, "loss": 0.09, "reward": null, "learning_rate": 4.0065787547042543e-07, "epoch": 0.88, "percentage": 87.87, "elapsed_time": "1:36:49", "remaining_time": "0:13:21"} +{"current_steps": 500, "total_steps": 569, "loss": 0.09, "reward": null, "learning_rate": 4.0065787547042543e-07, "epoch": 0.88, "percentage": 87.87, "elapsed_time": "1:36:49", "remaining_time": "0:13:21"} +{"current_steps": 510, "total_steps": 569, "loss": 0.1208, "reward": null, "learning_rate": 2.994422336044345e-07, "epoch": 0.9, "percentage": 89.63, "elapsed_time": "1:38:45", "remaining_time": "0:11:25"} +{"current_steps": 510, "total_steps": 569, "loss": 0.1208, "reward": null, "learning_rate": 2.994422336044345e-07, "epoch": 0.9, "percentage": 89.63, "elapsed_time": "1:38:45", "remaining_time": "0:11:25"} +{"current_steps": 510, "total_steps": 569, "loss": 0.1208, "reward": null, "learning_rate": 2.994422336044345e-07, "epoch": 0.9, "percentage": 89.63, "elapsed_time": "1:38:45", "remaining_time": "0:11:25"} +{"current_steps": 510, "total_steps": 569, "loss": 0.1208, "reward": null, "learning_rate": 2.994422336044345e-07, "epoch": 0.9, "percentage": 89.63, "elapsed_time": "1:38:45", "remaining_time": "0:11:25"} +{"current_steps": 520, "total_steps": 569, "loss": 0.0839, "reward": null, "learning_rate": 2.1255223980891027e-07, "epoch": 0.91, "percentage": 91.39, "elapsed_time": "1:40:42", "remaining_time": "0:09:29"} +{"current_steps": 520, "total_steps": 569, "loss": 0.0839, "reward": null, "learning_rate": 2.1255223980891027e-07, "epoch": 0.91, "percentage": 91.39, "elapsed_time": "1:40:42", "remaining_time": "0:09:29"} +{"current_steps": 520, "total_steps": 569, "loss": 0.0839, "reward": null, "learning_rate": 2.1255223980891027e-07, "epoch": 0.91, "percentage": 91.39, "elapsed_time": "1:40:42", "remaining_time": "0:09:29"} +{"current_steps": 520, "total_steps": 569, "loss": 0.0839, "reward": null, "learning_rate": 2.1255223980891027e-07, "epoch": 0.91, "percentage": 91.39, "elapsed_time": "1:40:42", "remaining_time": "0:09:29"} +{"current_steps": 530, "total_steps": 569, "loss": 0.0934, "reward": null, "learning_rate": 1.402527042476276e-07, "epoch": 0.93, "percentage": 93.15, "elapsed_time": "1:42:39", "remaining_time": "0:07:33"} +{"current_steps": 530, "total_steps": 569, "loss": 0.0934, "reward": null, "learning_rate": 1.402527042476276e-07, "epoch": 0.93, "percentage": 93.15, "elapsed_time": "1:42:39", "remaining_time": "0:07:33"} +{"current_steps": 530, "total_steps": 569, "loss": 0.0934, "reward": null, "learning_rate": 1.402527042476276e-07, "epoch": 0.93, "percentage": 93.15, "elapsed_time": "1:42:39", "remaining_time": "0:07:33"} +{"current_steps": 530, "total_steps": 569, "loss": 0.0934, "reward": null, "learning_rate": 1.402527042476276e-07, "epoch": 0.93, "percentage": 93.15, "elapsed_time": "1:42:39", "remaining_time": "0:07:33"} +{"current_steps": 540, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 8.276397049545359e-08, "epoch": 0.95, "percentage": 94.9, "elapsed_time": "1:44:33", "remaining_time": "0:05:36"} +{"current_steps": 540, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 8.276397049545359e-08, "epoch": 0.95, "percentage": 94.9, "elapsed_time": "1:44:33", "remaining_time": "0:05:36"} +{"current_steps": 540, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 8.276397049545359e-08, "epoch": 0.95, "percentage": 94.9, "elapsed_time": "1:44:33", "remaining_time": "0:05:36"} +{"current_steps": 540, "total_steps": 569, "loss": 0.094, "reward": null, "learning_rate": 8.276397049545359e-08, "epoch": 0.95, "percentage": 94.9, "elapsed_time": "1:44:33", "remaining_time": "0:05:36"} +{"current_steps": 550, "total_steps": 569, "loss": 0.0984, "reward": null, "learning_rate": 4.026124400856479e-08, "epoch": 0.97, "percentage": 96.66, "elapsed_time": "1:46:25", "remaining_time": "0:03:40"} +{"current_steps": 550, "total_steps": 569, "loss": 0.0984, "reward": null, "learning_rate": 4.026124400856479e-08, "epoch": 0.97, "percentage": 96.66, "elapsed_time": "1:46:25", "remaining_time": "0:03:40"} +{"current_steps": 550, "total_steps": 569, "loss": 0.0984, "reward": null, "learning_rate": 4.026124400856479e-08, "epoch": 0.97, "percentage": 96.66, "elapsed_time": "1:46:25", "remaining_time": "0:03:40"} +{"current_steps": 550, "total_steps": 569, "loss": 0.0984, "reward": null, "learning_rate": 4.026124400856479e-08, "epoch": 0.97, "percentage": 96.66, "elapsed_time": "1:46:25", "remaining_time": "0:03:40"} +{"current_steps": 560, "total_steps": 569, "loss": 0.0783, "reward": null, "learning_rate": 1.2874058159796366e-08, "epoch": 0.98, "percentage": 98.42, "elapsed_time": "1:48:21", "remaining_time": "0:01:44"} +{"current_steps": 560, "total_steps": 569, "loss": 0.0783, "reward": null, "learning_rate": 1.2874058159796366e-08, "epoch": 0.98, "percentage": 98.42, "elapsed_time": "1:48:21", "remaining_time": "0:01:44"} +{"current_steps": 560, "total_steps": 569, "loss": 0.0783, "reward": null, "learning_rate": 1.2874058159796366e-08, "epoch": 0.98, "percentage": 98.42, "elapsed_time": "1:48:21", "remaining_time": "0:01:44"} +{"current_steps": 560, "total_steps": 569, "loss": 0.0783, "reward": null, "learning_rate": 1.2874058159796366e-08, "epoch": 0.98, "percentage": 98.42, "elapsed_time": "1:48:21", "remaining_time": "0:01:44"} diff --git a/rm-lora/trainer_state.json b/rm-lora/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..dfa02f5564c87b6815555eb0d27e7c44f78100c2 --- /dev/null +++ b/rm-lora/trainer_state.json @@ -0,0 +1,361 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.9991220368744512, + "global_step": 569, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "learning_rate": 9.997256670306478e-06, + "loss": 0.6949, + "step": 10 + }, + { + "epoch": 0.04, + "learning_rate": 9.980502778148438e-06, + "loss": 0.6937, + "step": 20 + }, + { + "epoch": 0.05, + "learning_rate": 9.948570063910216e-06, + "loss": 0.6942, + "step": 30 + }, + { + "epoch": 0.07, + "learning_rate": 9.901555847282123e-06, + "loss": 0.6937, + "step": 40 + }, + { + "epoch": 0.09, + "learning_rate": 9.839603411073388e-06, + "loss": 0.675, + "step": 50 + }, + { + "epoch": 0.11, + "learning_rate": 9.762901564536523e-06, + "loss": 0.657, + "step": 60 + }, + { + "epoch": 0.12, + "learning_rate": 9.671684067943056e-06, + "loss": 0.6437, + "step": 70 + }, + { + "epoch": 0.14, + "learning_rate": 9.566228920164405e-06, + "loss": 0.6067, + "step": 80 + }, + { + "epoch": 0.16, + "learning_rate": 9.446857511429e-06, + "loss": 0.5389, + "step": 90 + }, + { + "epoch": 0.18, + "learning_rate": 9.313933643837825e-06, + "loss": 0.3593, + "step": 100 + }, + { + "epoch": 0.19, + "learning_rate": 9.167862422623474e-06, + "loss": 0.1982, + "step": 110 + }, + { + "epoch": 0.21, + "learning_rate": 9.009089021531777e-06, + "loss": 0.1791, + "step": 120 + }, + { + "epoch": 0.23, + "learning_rate": 8.838097326088667e-06, + "loss": 0.1522, + "step": 130 + }, + { + "epoch": 0.25, + "learning_rate": 8.65540845888717e-06, + "loss": 0.1841, + "step": 140 + }, + { + "epoch": 0.26, + "learning_rate": 8.46157919138889e-06, + "loss": 0.1299, + "step": 150 + }, + { + "epoch": 0.28, + "learning_rate": 8.257200247080249e-06, + "loss": 0.1695, + "step": 160 + }, + { + "epoch": 0.3, + "learning_rate": 8.042894501154937e-06, + "loss": 0.1536, + "step": 170 + }, + { + "epoch": 0.32, + "learning_rate": 7.819315082209217e-06, + "loss": 0.1233, + "step": 180 + }, + { + "epoch": 0.33, + "learning_rate": 7.587143381735498e-06, + "loss": 0.1254, + "step": 190 + }, + { + "epoch": 0.35, + "learning_rate": 7.347086977480552e-06, + "loss": 0.1153, + "step": 200 + }, + { + "epoch": 0.37, + "learning_rate": 7.09987747699721e-06, + "loss": 0.1524, + "step": 210 + }, + { + "epoch": 0.39, + "learning_rate": 6.846268287961667e-06, + "loss": 0.1299, + "step": 220 + }, + { + "epoch": 0.4, + "learning_rate": 6.587032322051667e-06, + "loss": 0.1232, + "step": 230 + }, + { + "epoch": 0.42, + "learning_rate": 6.32295963938335e-06, + "loss": 0.1385, + "step": 240 + }, + { + "epoch": 0.44, + "learning_rate": 6.05485504068568e-06, + "loss": 0.1248, + "step": 250 + }, + { + "epoch": 0.46, + "learning_rate": 5.783535614550666e-06, + "loss": 0.1271, + "step": 260 + }, + { + "epoch": 0.47, + "learning_rate": 5.509828247234505e-06, + "loss": 0.073, + "step": 270 + }, + { + "epoch": 0.49, + "learning_rate": 5.234567102598881e-06, + "loss": 0.1234, + "step": 280 + }, + { + "epoch": 0.51, + "learning_rate": 4.958591079872667e-06, + "loss": 0.1003, + "step": 290 + }, + { + "epoch": 0.53, + "learning_rate": 4.682741256981922e-06, + "loss": 0.1757, + "step": 300 + }, + { + "epoch": 0.54, + "learning_rate": 4.407858327239952e-06, + "loss": 0.1151, + "step": 310 + }, + { + "epoch": 0.56, + "learning_rate": 4.134780037209563e-06, + "loss": 0.1124, + "step": 320 + }, + { + "epoch": 0.58, + "learning_rate": 3.864338633545956e-06, + "loss": 0.0899, + "step": 330 + }, + { + "epoch": 0.6, + "learning_rate": 3.597358326601413e-06, + "loss": 0.1251, + "step": 340 + }, + { + "epoch": 0.61, + "learning_rate": 3.334652778521813e-06, + "loss": 0.171, + "step": 350 + }, + { + "epoch": 0.63, + "learning_rate": 3.077022623490371e-06, + "loss": 0.1447, + "step": 360 + }, + { + "epoch": 0.65, + "learning_rate": 2.825253027676026e-06, + "loss": 0.1192, + "step": 370 + }, + { + "epoch": 0.67, + "learning_rate": 2.580111296322904e-06, + "loss": 0.1158, + "step": 380 + }, + { + "epoch": 0.68, + "learning_rate": 2.342344535273608e-06, + "loss": 0.1028, + "step": 390 + }, + { + "epoch": 0.7, + "learning_rate": 2.112677374053164e-06, + "loss": 0.1171, + "step": 400 + }, + { + "epoch": 0.72, + "learning_rate": 1.8918097574529193e-06, + "loss": 0.1017, + "step": 410 + }, + { + "epoch": 0.74, + "learning_rate": 1.68041481234479e-06, + "loss": 0.0763, + "step": 420 + }, + { + "epoch": 0.76, + "learning_rate": 1.4791367962271425e-06, + "loss": 0.1185, + "step": 430 + }, + { + "epoch": 0.77, + "learning_rate": 1.2885891337543539e-06, + "loss": 0.0701, + "step": 440 + }, + { + "epoch": 0.79, + "learning_rate": 1.1093525472340471e-06, + "loss": 0.0873, + "step": 450 + }, + { + "epoch": 0.81, + "learning_rate": 9.419732867896048e-07, + "loss": 0.127, + "step": 460 + }, + { + "epoch": 0.83, + "learning_rate": 7.869614655817576e-07, + "loss": 0.1289, + "step": 470 + }, + { + "epoch": 0.84, + "learning_rate": 6.44789505162955e-07, + "loss": 0.1211, + "step": 480 + }, + { + "epoch": 0.86, + "learning_rate": 5.158906957025079e-07, + "loss": 0.094, + "step": 490 + }, + { + "epoch": 0.88, + "learning_rate": 4.0065787547042543e-07, + "loss": 0.09, + "step": 500 + }, + { + "epoch": 0.9, + "learning_rate": 2.994422336044345e-07, + "loss": 0.1208, + "step": 510 + }, + { + "epoch": 0.91, + "learning_rate": 2.1255223980891027e-07, + "loss": 0.0839, + "step": 520 + }, + { + "epoch": 0.93, + "learning_rate": 1.402527042476276e-07, + "loss": 0.0934, + "step": 530 + }, + { + "epoch": 0.95, + "learning_rate": 8.276397049545359e-08, + "loss": 0.094, + "step": 540 + }, + { + "epoch": 0.97, + "learning_rate": 4.026124400856479e-08, + "loss": 0.0984, + "step": 550 + }, + { + "epoch": 0.98, + "learning_rate": 1.2874058159796366e-08, + "loss": 0.0783, + "step": 560 + }, + { + "epoch": 1.0, + "step": 569, + "total_flos": 0.0, + "train_loss": 0.21165546916281192, + "train_runtime": 6592.6141, + "train_samples_per_second": 5.528, + "train_steps_per_second": 0.086 + } + ], + "max_steps": 569, + "num_train_epochs": 1, + "total_flos": 0.0, + "trial_name": null, + "trial_params": null +} diff --git a/rm-lora/training_args.bin b/rm-lora/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..d329ecd4f19063c5d16489af21f6840b27b96beb --- /dev/null +++ b/rm-lora/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9721221201616afd6cd70c678b34100cc9bfc8a766c143b6197ce3d08c049687 +size 3271 diff --git a/rm-lora/training_loss.png b/rm-lora/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..43695c27849f92f7bfb868d2f95e87333f4fc9c9 Binary files /dev/null and b/rm-lora/training_loss.png differ diff --git a/rm-lora/value_head.bin b/rm-lora/value_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..562bae81fdcd18b9044855778db9d48f99de0b82 --- /dev/null +++ b/rm-lora/value_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a3e9ff7365afb5700eb56adc47113942dd77a4d792c28baa2438f4dbc318916 +size 21491 diff --git a/sft-lora/README.md b/sft-lora/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/adapter_config.json b/sft-lora/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/adapter_model.bin b/sft-lora/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..94aa4bf44c0902393f9de0762ab8ccf4180bd5d7 --- /dev/null +++ b/sft-lora/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84cf9e598366adf9b8511f973b4d1c5584ed8571f2abbafb990ddf99b3db0df7 +size 26269517 diff --git a/sft-lora/all_results.json b/sft-lora/all_results.json new file mode 100644 index 0000000000000000000000000000000000000000..04c7e4f99f6e15df1ed565949ba52b8573052183 --- /dev/null +++ b/sft-lora/all_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 2.0, + "train_loss": 0.819440008492324, + "train_runtime": 68529.0816, + "train_samples_per_second": 6.597, + "train_steps_per_second": 0.103 +} \ No newline at end of file diff --git a/sft-lora/checkpoint-1000/README.md b/sft-lora/checkpoint-1000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/checkpoint-1000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/checkpoint-1000/adapter_config.json b/sft-lora/checkpoint-1000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/checkpoint-1000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/checkpoint-1000/adapter_model.bin b/sft-lora/checkpoint-1000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..0105564b7bcbed5241c1e00d027cfe8c467c1512 --- /dev/null +++ b/sft-lora/checkpoint-1000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49166d1be828a038edfdd1f95fbeefe4e927fdb47b8797f273a0e274e074cc54 +size 26269517 diff --git a/sft-lora/checkpoint-1000/finetuning_args.json b/sft-lora/checkpoint-1000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/checkpoint-1000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/checkpoint-1000/optimizer.pt b/sft-lora/checkpoint-1000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..cae2d0ea5cff8aef7ae6e5d70c235675f1ba90a6 --- /dev/null +++ b/sft-lora/checkpoint-1000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:563d3c3905c63cedd152ff2795501dd2840392bc2c9d5be494f972be531f671b +size 52562821 diff --git a/sft-lora/checkpoint-1000/rng_state_0.pth b/sft-lora/checkpoint-1000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e53764928430fe7114703f2645e078a66de956ac --- /dev/null +++ b/sft-lora/checkpoint-1000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1861187ed29864a34a274819277748606c140a8a54f9855b4010d1a3b1262252 +size 18679 diff --git a/sft-lora/checkpoint-1000/rng_state_1.pth b/sft-lora/checkpoint-1000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0668465d157684b4930a2b5cbc0e928dc663b72 --- /dev/null +++ b/sft-lora/checkpoint-1000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1a43a503c0c1cef10b6406a484cd1cc4786ea475b7a565189f777cc2921d11 +size 18679 diff --git a/sft-lora/checkpoint-1000/rng_state_2.pth b/sft-lora/checkpoint-1000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..94781b4230eb7319a97e2dc109ee14a5f452dcdd --- /dev/null +++ b/sft-lora/checkpoint-1000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8a5d9504efb5c0f487d4382ef1567e19039e679b4b3786908d3af7dd41db84 +size 18679 diff --git a/sft-lora/checkpoint-1000/rng_state_3.pth b/sft-lora/checkpoint-1000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8fef772262726c9870b9bdc274f09e6a03ec212d --- /dev/null +++ b/sft-lora/checkpoint-1000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05670d089596e2c7f3408383b58b668b05e193e7533b3391b742d6e5b3f5aa2d +size 18679 diff --git a/sft-lora/checkpoint-1000/scheduler.pt b/sft-lora/checkpoint-1000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..79aae0d92ca00e8feef41d32ee19e5bdc9d491c8 --- /dev/null +++ b/sft-lora/checkpoint-1000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a591e3a265f45cc7ea1e1f12ab952409ddc4d51476e1e6e5b82f1289d6c35f2e +size 627 diff --git a/sft-lora/checkpoint-1000/trainer_state.json b/sft-lora/checkpoint-1000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..a1a6748ec857e2223b554af52c6723e4533c60cd --- /dev/null +++ b/sft-lora/checkpoint-1000/trainer_state.json @@ -0,0 +1,616 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.28312570781426954, + "global_step": 1000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 3.539384062886019e+18, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/checkpoint-1000/training_args.bin b/sft-lora/checkpoint-1000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/checkpoint-1000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/checkpoint-2000/README.md b/sft-lora/checkpoint-2000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/checkpoint-2000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/checkpoint-2000/adapter_config.json b/sft-lora/checkpoint-2000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/checkpoint-2000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/checkpoint-2000/adapter_model.bin b/sft-lora/checkpoint-2000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6da61d385b9cd331e573c3f1d15e57fdb118cc51 --- /dev/null +++ b/sft-lora/checkpoint-2000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f6f135623dda22e316f833ef5f7c2e7a5465fd3313464ab89d0f3e60a3890e2 +size 26269517 diff --git a/sft-lora/checkpoint-2000/finetuning_args.json b/sft-lora/checkpoint-2000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/checkpoint-2000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/checkpoint-2000/optimizer.pt b/sft-lora/checkpoint-2000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d2f0a46a7a9e0e02855fdc192015b68fb6733f2 --- /dev/null +++ b/sft-lora/checkpoint-2000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e397c188ac6fcbd66336193ccfeb238d1a53bbfb79b7c21b8b238acfbf0d7ea +size 52562821 diff --git a/sft-lora/checkpoint-2000/rng_state_0.pth b/sft-lora/checkpoint-2000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..49df96d969c916b860405c00c88024ca09bcf369 --- /dev/null +++ b/sft-lora/checkpoint-2000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7465f2ce05639a998be3048ae8b2b3ddc511bd8df0ac0af63a4781d83ba13d1 +size 18679 diff --git a/sft-lora/checkpoint-2000/rng_state_1.pth b/sft-lora/checkpoint-2000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..cefe4e53c0b772e71fcb83f33003393cea0b087e --- /dev/null +++ b/sft-lora/checkpoint-2000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ee3a01821de7105bb38914d05f567f5ca9005a475248f6ff57a994dda760946 +size 18679 diff --git a/sft-lora/checkpoint-2000/rng_state_2.pth b/sft-lora/checkpoint-2000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0216babc382454d6b6ee1c14da388ffb76d01769 --- /dev/null +++ b/sft-lora/checkpoint-2000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f7328df9304c13f5f3ac9062a268875c9d2eb34607511e75df0f729cd3e462 +size 18679 diff --git a/sft-lora/checkpoint-2000/rng_state_3.pth b/sft-lora/checkpoint-2000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa2991275b5aeab5d5bbff85b8589eb48d78b93b --- /dev/null +++ b/sft-lora/checkpoint-2000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:363a7b98f242c61426c18c7085f5f8d7a1a938e734adb4c74cdcb7e8c3a8f683 +size 18679 diff --git a/sft-lora/checkpoint-2000/scheduler.pt b/sft-lora/checkpoint-2000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f579a1bc205ecfd68870c1065bf18043c82ec1 --- /dev/null +++ b/sft-lora/checkpoint-2000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e63b0f7d224d36a047a120fdc989122c10ff555fd9e9271cc2a05e908022f9 +size 627 diff --git a/sft-lora/checkpoint-2000/trainer_state.json b/sft-lora/checkpoint-2000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..c70e812532f39c56c5a6dc2ab11c3371dd0ef40f --- /dev/null +++ b/sft-lora/checkpoint-2000/trainer_state.json @@ -0,0 +1,1216 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.5662514156285391, + "global_step": 2000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8524, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.8687, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8505, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8754, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8583, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.8698, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8661, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8574, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.852, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8619, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8632, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8529, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8529, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8465, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8604, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8649, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8572, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8634, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8478, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8475, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8537, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8499, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8467, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8538, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8619, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8593, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8484, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8395, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8547, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8586, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.839, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8417, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8404, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.843, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8557, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8504, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8579, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8563, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.8446, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.8524, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8417, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8582, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.841, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8529, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8545, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8471, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8379, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8542, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8463, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8362, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8467, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8501, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8541, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8443, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8297, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8532, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.854, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.849, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8516, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8394, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8399, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8242, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8395, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8355, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8299, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8272, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8336, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8264, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8381, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8278, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8458, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8348, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.814, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.838, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.824, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.8314, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.821, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8311, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8443, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8315, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8184, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8364, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.8186, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8454, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.832, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8027, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8365, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.8523, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8377, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8299, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8273, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.813, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8262, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8258, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8248, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8123, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8304, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.849, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8255, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8317, + "step": 2000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 7.078895870984323e+18, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/checkpoint-2000/training_args.bin b/sft-lora/checkpoint-2000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/checkpoint-2000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/checkpoint-3000/README.md b/sft-lora/checkpoint-3000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/checkpoint-3000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/checkpoint-3000/adapter_config.json b/sft-lora/checkpoint-3000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/checkpoint-3000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/checkpoint-3000/adapter_model.bin b/sft-lora/checkpoint-3000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7ce98d1b8fd6f9625c281f7aae564b887dff1b1 --- /dev/null +++ b/sft-lora/checkpoint-3000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eef6f65255eded92df77e7c864129f28ade33fe379f269e884866ff92e3ad99 +size 26269517 diff --git a/sft-lora/checkpoint-3000/finetuning_args.json b/sft-lora/checkpoint-3000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/checkpoint-3000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/checkpoint-3000/optimizer.pt b/sft-lora/checkpoint-3000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8c05e24658c3b346892c35f5340d08ea213bad7 --- /dev/null +++ b/sft-lora/checkpoint-3000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f873335e077dee24ec772f15d53744f4967256c87b9c5e617c6e1423d713a90 +size 52562821 diff --git a/sft-lora/checkpoint-3000/rng_state_0.pth b/sft-lora/checkpoint-3000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8452d3faaa8a76655031eba09ec2681ecaf0716 --- /dev/null +++ b/sft-lora/checkpoint-3000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a7eb5b8e8df77a28bae52aab0825bbf464c442823a918c8ab23ef65981e021 +size 18679 diff --git a/sft-lora/checkpoint-3000/rng_state_1.pth b/sft-lora/checkpoint-3000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fb8d272d882b95fd4ce5c9569c3cd938d58e91b --- /dev/null +++ b/sft-lora/checkpoint-3000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1631a5d40918fbf5f8ae222feb84849c1ede3edd65f16ee958ba249cf9aa97c +size 18679 diff --git a/sft-lora/checkpoint-3000/rng_state_2.pth b/sft-lora/checkpoint-3000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..712a4258915fa36496ee996800a62762f6fe4091 --- /dev/null +++ b/sft-lora/checkpoint-3000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7eeef1946d7c0d7991d091de6cd19ddde849be1517808f4a188ce2b388d40d +size 18679 diff --git a/sft-lora/checkpoint-3000/rng_state_3.pth b/sft-lora/checkpoint-3000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..523092e5605a432b13312e5ea1a01056523855ff --- /dev/null +++ b/sft-lora/checkpoint-3000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7daeb6aa713d94eb58a4d49781817819edcb074368e56ca383283dd59f60ce0b +size 18679 diff --git a/sft-lora/checkpoint-3000/scheduler.pt b/sft-lora/checkpoint-3000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..23c3cbe8a05547e4b38f4612b48acd2e829c9ecf --- /dev/null +++ b/sft-lora/checkpoint-3000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b3f6531267b4bdbf5a6a0db75b0e9169e561b588905320233f1373d13e9940 +size 627 diff --git a/sft-lora/checkpoint-3000/trainer_state.json b/sft-lora/checkpoint-3000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..856cbbbd891f811e0ff67a4ad8d5e2e6d98a885e --- /dev/null +++ b/sft-lora/checkpoint-3000/trainer_state.json @@ -0,0 +1,1816 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.8493771234428086, + "global_step": 3000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8524, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.8687, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8505, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8754, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8583, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.8698, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8661, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8574, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.852, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8619, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8632, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8529, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8529, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8465, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8604, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8649, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8572, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8634, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8478, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8475, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8537, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8499, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8467, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8538, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8619, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8593, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8484, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8395, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8547, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8586, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.839, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8417, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8404, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.843, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8557, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8504, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8579, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8563, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.8446, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.8524, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8417, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8582, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.841, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8529, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8545, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8471, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8379, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8542, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8463, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8362, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8467, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8501, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8541, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8443, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8297, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8532, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.854, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.849, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8516, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8394, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8399, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8242, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8395, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8355, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8299, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8272, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8336, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8264, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8381, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8278, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8458, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8348, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.814, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.838, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.824, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.8314, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.821, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8311, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8443, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8315, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8184, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8364, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.8186, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8454, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.832, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8027, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8365, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.8523, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8377, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8299, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8273, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.813, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8262, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8258, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8248, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8123, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8304, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.849, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8255, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8317, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8331, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8309, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8117, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8155, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8178, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8155, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.8273, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8021, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8374, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8173, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8227, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8275, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8226, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.815, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8306, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8424, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8051, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8117, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.8123, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8038, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8308, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8187, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8274, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8171, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8213, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8241, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8296, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8247, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8399, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8015, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.8204, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8198, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8045, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.8185, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8123, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8093, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8194, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8121, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.811, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8013, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8215, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.8079, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.821, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8097, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8046, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8112, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8099, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8148, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8105, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8132, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8149, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8306, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8106, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8192, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8129, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8155, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.8039, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8109, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8063, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8275, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8107, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8047, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8123, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8241, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.812, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8161, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.797, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8155, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.797, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8153, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8016, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8138, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8178, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8062, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8101, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.7982, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8021, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.817, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.8083, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8047, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8063, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8139, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.8075, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.8056, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8242, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.8041, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8088, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8121, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.8151, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8064, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8151, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7942, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8131, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8015, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8053, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.7986, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7936, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8235, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8083, + "step": 3000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 1.062254149276323e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/checkpoint-3000/training_args.bin b/sft-lora/checkpoint-3000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/checkpoint-3000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/checkpoint-4000/README.md b/sft-lora/checkpoint-4000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/checkpoint-4000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/checkpoint-4000/adapter_config.json b/sft-lora/checkpoint-4000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/checkpoint-4000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/checkpoint-4000/adapter_model.bin b/sft-lora/checkpoint-4000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..2eb5c2665edecbf3b9e447cb7ff3292e0cc9cf2f --- /dev/null +++ b/sft-lora/checkpoint-4000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:227d9b846b8503334aed55d6bc835b6c882f7ca4d7c4a68cb689ce99243573b7 +size 26269517 diff --git a/sft-lora/checkpoint-4000/finetuning_args.json b/sft-lora/checkpoint-4000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/checkpoint-4000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/checkpoint-4000/optimizer.pt b/sft-lora/checkpoint-4000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbb18aed73af4f143374effacb41c0bc9f7b324d --- /dev/null +++ b/sft-lora/checkpoint-4000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87cf16661a25f70009edd1ad211bd32f16759e498b5fdda597ce49e836a9eb5b +size 52562821 diff --git a/sft-lora/checkpoint-4000/rng_state_0.pth b/sft-lora/checkpoint-4000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3767665ccfb89290b870aca38b4ff390d5a94306 --- /dev/null +++ b/sft-lora/checkpoint-4000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5978240c798217567b7409b3e3c7de5f7291e7ae6eb4c309423593affef4653b +size 18679 diff --git a/sft-lora/checkpoint-4000/rng_state_1.pth b/sft-lora/checkpoint-4000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..f6e40d09f3e4e39f635158cffb8df47fa3f46a40 --- /dev/null +++ b/sft-lora/checkpoint-4000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64f4894fc31ab7c0c49ae19facf802bebc8846340239b23a7ad9f2f7a0e1d1a +size 18679 diff --git a/sft-lora/checkpoint-4000/rng_state_2.pth b/sft-lora/checkpoint-4000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f9e9f58f17b641ff0e3d9da55d8d48899d005921 --- /dev/null +++ b/sft-lora/checkpoint-4000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7ded5e4425f3a43a00810873c05393ff8acafce3f3347f9b2a6673dbaa1939 +size 18679 diff --git a/sft-lora/checkpoint-4000/rng_state_3.pth b/sft-lora/checkpoint-4000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ebaab8b29c2507ada6c2782d4b725caa8ec483b6 --- /dev/null +++ b/sft-lora/checkpoint-4000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb9df962e1207e2a5858e2bcf9d6f4123a9a9f636f71f15d2d6dca8f8248092 +size 18679 diff --git a/sft-lora/checkpoint-4000/scheduler.pt b/sft-lora/checkpoint-4000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a2d33d284e4848bd18d8934b7e240129b62bf4d --- /dev/null +++ b/sft-lora/checkpoint-4000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf7e35bc1d9d6e77c904ac697970bf3fe9271b75c118e224f479ab9fa296d48 +size 627 diff --git a/sft-lora/checkpoint-4000/trainer_state.json b/sft-lora/checkpoint-4000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..297467ba5de98deff0bf36ca33f447d489f07e63 --- /dev/null +++ b/sft-lora/checkpoint-4000/trainer_state.json @@ -0,0 +1,2416 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.1325028312570782, + "global_step": 4000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8524, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.8687, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8505, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8754, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8583, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.8698, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8661, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8574, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.852, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8619, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8632, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8529, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8529, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8465, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8604, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8649, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8572, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8634, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8478, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8475, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8537, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8499, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8467, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8538, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8619, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8593, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8484, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8395, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8547, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8586, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.839, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8417, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8404, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.843, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8557, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8504, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8579, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8563, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.8446, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.8524, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8417, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8582, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.841, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8529, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8545, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8471, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8379, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8542, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8463, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8362, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8467, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8501, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8541, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8443, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8297, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8532, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.854, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.849, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8516, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8394, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8399, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8242, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8395, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8355, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8299, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8272, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8336, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8264, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8381, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8278, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8458, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8348, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.814, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.838, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.824, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.8314, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.821, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8311, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8443, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8315, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8184, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8364, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.8186, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8454, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.832, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8027, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8365, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.8523, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8377, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8299, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8273, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.813, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8262, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8258, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8248, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8123, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8304, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.849, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8255, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8317, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8331, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8309, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8117, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8155, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8178, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8155, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.8273, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8021, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8374, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8173, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8227, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8275, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8226, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.815, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8306, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8424, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8051, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8117, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.8123, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8038, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8308, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8187, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8274, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8171, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8213, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8241, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8296, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8247, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8399, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8015, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.8204, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8198, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8045, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.8185, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8123, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8093, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8194, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8121, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.811, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8013, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8215, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.8079, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.821, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8097, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8046, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8112, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8099, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8148, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8105, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8132, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8149, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8306, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8106, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8192, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8129, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8155, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.8039, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8109, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8063, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8275, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8107, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8047, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8123, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8241, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.812, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8161, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.797, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8155, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.797, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8153, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8016, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8138, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8178, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8062, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8101, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.7982, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8021, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.817, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.8083, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8047, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8063, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8139, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.8075, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.8056, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8242, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.8041, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8088, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8121, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.8151, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8064, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8151, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7942, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8131, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8015, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8053, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.7986, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7936, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8235, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8083, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8081, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.7981, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8152, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.8091, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8206, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7947, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8116, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8135, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8032, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8023, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8116, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8048, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.8032, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.808, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8057, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8013, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.802, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.804, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.7983, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8083, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8203, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.792, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8006, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.7953, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8057, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8005, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8082, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.811, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.7981, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8018, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.7991, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8057, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8156, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8003, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.7976, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7894, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.7953, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8124, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8073, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.7979, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8023, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8046, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.8082, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7868, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.7938, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.8215, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.807, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7878, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.7968, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.787, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.8011, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8086, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8125, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8125, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7805, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.817, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8056, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7752, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7749, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8073, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.8117, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8008, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8028, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.7974, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7867, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8002, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8095, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7847, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7693, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8078, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7925, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.77, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7962, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.8014, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7934, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.7978, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8022, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7934, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.7975, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.807, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7754, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.7977, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7922, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7862, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7918, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.781, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7786, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8067, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7755, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7958, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8064, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.7967, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8107, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7857, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7732, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.7768, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7839, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7923, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.7994, + "step": 4000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 1.4165134656428573e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/checkpoint-4000/training_args.bin b/sft-lora/checkpoint-4000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/checkpoint-4000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/checkpoint-5000/README.md b/sft-lora/checkpoint-5000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/checkpoint-5000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/checkpoint-5000/adapter_config.json b/sft-lora/checkpoint-5000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/checkpoint-5000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/checkpoint-5000/adapter_model.bin b/sft-lora/checkpoint-5000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..a608930593dce40b31982768d8b79a13eb876c86 --- /dev/null +++ b/sft-lora/checkpoint-5000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c5cfc4286a0be60fac158728fa37bddbfbc750d50470e09c4a135d475e9d3a +size 26269517 diff --git a/sft-lora/checkpoint-5000/finetuning_args.json b/sft-lora/checkpoint-5000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/checkpoint-5000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/checkpoint-5000/optimizer.pt b/sft-lora/checkpoint-5000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..43a74e51a5407a5bea8a6429ce8cbaddf5912bc2 --- /dev/null +++ b/sft-lora/checkpoint-5000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4793b5793aa90ea0107163b4d21a4112530ba023a5fa8103c9d8bda4fb7a55ae +size 52562821 diff --git a/sft-lora/checkpoint-5000/rng_state_0.pth b/sft-lora/checkpoint-5000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..5da9a617f64d389af19f5d0d0570d46b200a2d90 --- /dev/null +++ b/sft-lora/checkpoint-5000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa749ac37126149519409e153b6a8d5b3c73f6a7f974468df2f22c8609c043bb +size 18679 diff --git a/sft-lora/checkpoint-5000/rng_state_1.pth b/sft-lora/checkpoint-5000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..920d8b2cf5e3bb4549e93a9710fdd148cabb282b --- /dev/null +++ b/sft-lora/checkpoint-5000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba980348eaaec0de5f70f2b287f51dac0c18bf077ed911273607198816af372d +size 18679 diff --git a/sft-lora/checkpoint-5000/rng_state_2.pth b/sft-lora/checkpoint-5000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..db173929b2ebb647af075a56648289e6a8da3f41 --- /dev/null +++ b/sft-lora/checkpoint-5000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ebbc42d20a73ad681f46a8a00221372524e938f097ed8d1826e8d19cdecbee +size 18679 diff --git a/sft-lora/checkpoint-5000/rng_state_3.pth b/sft-lora/checkpoint-5000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce789088719c6cfacd5ae332c4d20e73956a21c5 --- /dev/null +++ b/sft-lora/checkpoint-5000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bba97ce2b3768f04f06dc80bc80340b192812258930e01279d032cfa9504c74 +size 18679 diff --git a/sft-lora/checkpoint-5000/scheduler.pt b/sft-lora/checkpoint-5000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..93cd0dbf81609d0debef9fb5cda4c8acb8c059a5 --- /dev/null +++ b/sft-lora/checkpoint-5000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db195081860175516ac4c042df5e0feb44c256b1465e3f90b62e8f0170baebb8 +size 627 diff --git a/sft-lora/checkpoint-5000/trainer_state.json b/sft-lora/checkpoint-5000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..1f98a7b50378d2b3e286d744029f001d5dad30c3 --- /dev/null +++ b/sft-lora/checkpoint-5000/trainer_state.json @@ -0,0 +1,3016 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.4156285390713477, + "global_step": 5000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8524, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.8687, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8505, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8754, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8583, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.8698, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8661, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8574, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.852, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8619, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8632, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8529, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8529, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8465, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8604, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8649, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8572, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8634, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8478, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8475, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8537, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8499, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8467, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8538, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8619, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8593, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8484, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8395, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8547, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8586, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.839, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8417, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8404, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.843, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8557, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8504, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8579, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8563, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.8446, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.8524, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8417, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8582, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.841, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8529, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8545, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8471, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8379, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8542, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8463, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8362, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8467, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8501, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8541, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8443, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8297, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8532, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.854, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.849, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8516, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8394, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8399, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8242, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8395, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8355, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8299, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8272, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8336, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8264, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8381, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8278, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8458, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8348, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.814, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.838, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.824, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.8314, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.821, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8311, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8443, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8315, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8184, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8364, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.8186, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8454, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.832, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8027, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8365, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.8523, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8377, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8299, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8273, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.813, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8262, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8258, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8248, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8123, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8304, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.849, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8255, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8317, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8331, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8309, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8117, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8155, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8178, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8155, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.8273, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8021, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8374, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8173, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8227, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8275, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8226, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.815, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8306, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8424, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8051, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8117, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.8123, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8038, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8308, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8187, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8274, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8171, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8213, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8241, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8296, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8247, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8399, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8015, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.8204, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8198, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8045, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.8185, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8123, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8093, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8194, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8121, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.811, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8013, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8215, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.8079, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.821, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8097, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8046, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8112, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8099, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8148, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8105, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8132, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8149, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8306, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8106, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8192, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8129, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8155, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.8039, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8109, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8063, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8275, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8107, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8047, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8123, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8241, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.812, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8161, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.797, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8155, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.797, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8153, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8016, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8138, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8178, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8062, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8101, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.7982, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8021, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.817, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.8083, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8047, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8063, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8139, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.8075, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.8056, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8242, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.8041, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8088, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8121, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.8151, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8064, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8151, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7942, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8131, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8015, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8053, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.7986, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7936, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8235, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8083, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8081, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.7981, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8152, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.8091, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8206, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7947, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8116, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8135, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8032, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8023, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8116, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8048, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.8032, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.808, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8057, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8013, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.802, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.804, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.7983, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8083, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8203, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.792, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8006, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.7953, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8057, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8005, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8082, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.811, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.7981, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8018, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.7991, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8057, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8156, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8003, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.7976, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7894, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.7953, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8124, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8073, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.7979, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8023, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8046, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.8082, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7868, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.7938, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.8215, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.807, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7878, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.7968, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.787, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.8011, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8086, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8125, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8125, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7805, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.817, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8056, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7752, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7749, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8073, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.8117, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8008, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8028, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.7974, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7867, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8002, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8095, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7847, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7693, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8078, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7925, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.77, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7962, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.8014, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7934, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.7978, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8022, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7934, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.7975, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.807, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7754, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.7977, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7922, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7862, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7918, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.781, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7786, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8067, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7755, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7958, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8064, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.7967, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8107, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7857, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7732, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.7768, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7839, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7923, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.7994, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7907, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7908, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7731, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7769, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.795, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8147, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8065, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7879, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.7755, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7852, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7912, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7934, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.7966, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.7976, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7843, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7848, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7675, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8059, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7871, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.776, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7911, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7934, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7922, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.7931, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7926, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7881, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7842, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7807, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7926, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7878, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7843, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.7748, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.802, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7864, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.7884, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7832, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8039, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.7737, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7844, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7865, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.7983, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7851, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7798, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.79, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7694, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7874, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7878, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.7992, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8003, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7778, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.773, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7872, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.7977, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7792, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7792, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7836, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8005, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7937, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7692, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7926, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7725, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7936, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7776, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7785, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7735, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7925, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7846, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.7782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2696292959503922e-05, + "loss": 0.7888, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2599628708177253e-05, + "loss": 0.7898, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.250320972002072e-05, + "loss": 0.7956, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2407037902076168e-05, + "loss": 0.7735, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.23111151564967e-05, + "loss": 0.7842, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215443380509125e-05, + "loss": 0.7892, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2120024466376381e-05, + "loss": 0.7822, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2024860301360131e-05, + "loss": 0.7788, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1929952767683426e-05, + "loss": 0.7824, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1835303742493508e-05, + "loss": 0.7859, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1740915097824629e-05, + "loss": 0.7897, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.1646788700561085e-05, + "loss": 0.768, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1552926412400225e-05, + "loss": 0.7935, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1459330089815699e-05, + "loss": 0.7933, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.136600158402068e-05, + "loss": 0.7792, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1272942740931286e-05, + "loss": 0.7839, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1180155401130044e-05, + "loss": 0.7844, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.1087641399829527e-05, + "loss": 0.7753, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0995402566835997e-05, + "loss": 0.791, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.090344072651328e-05, + "loss": 0.7998, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0811757697746614e-05, + "loss": 0.7864, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0720355293906741e-05, + "loss": 0.7702, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0629235322813982e-05, + "loss": 0.7705, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0538399586702507e-05, + "loss": 0.7941, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0447849882184715e-05, + "loss": 0.7779, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.035758800021564e-05, + "loss": 0.7755, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0267615726057592e-05, + "loss": 0.7825, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0177934839244787e-05, + "loss": 0.7983, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0088547113548211e-05, + "loss": 0.773, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99945431694048e-06, + "loss": 0.7794, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.910658211560902e-06, + "loss": 0.7889, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.822160553680617e-06, + "loss": 0.7809, + "step": 5000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 1.7714547482983137e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/checkpoint-5000/training_args.bin b/sft-lora/checkpoint-5000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/checkpoint-5000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/checkpoint-6000/README.md b/sft-lora/checkpoint-6000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/checkpoint-6000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/checkpoint-6000/adapter_config.json b/sft-lora/checkpoint-6000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/checkpoint-6000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/checkpoint-6000/adapter_model.bin b/sft-lora/checkpoint-6000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d46aadc78c7c7ca8f6923f8f10dd6798e040ba6 --- /dev/null +++ b/sft-lora/checkpoint-6000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c17b1864e89b0353438dad19ae6c41b11337f863f9fd74bac552e9f7bc1923b0 +size 26269517 diff --git a/sft-lora/checkpoint-6000/finetuning_args.json b/sft-lora/checkpoint-6000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/checkpoint-6000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/checkpoint-6000/optimizer.pt b/sft-lora/checkpoint-6000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd7f7484139484cd99e24358deb5f5ef1c336ee --- /dev/null +++ b/sft-lora/checkpoint-6000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeca3bae2b629ac2b0240908e89b35166f0c6ae5d14c9b06a762d4e014589689 +size 52562821 diff --git a/sft-lora/checkpoint-6000/rng_state_0.pth b/sft-lora/checkpoint-6000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..702d1d371cc01630d5c2e0eee505cb4a2f993d10 --- /dev/null +++ b/sft-lora/checkpoint-6000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b5afb582286dc1f513c8f1589e44203922864b0eecb5d968bb7e9bc87aa84e +size 18679 diff --git a/sft-lora/checkpoint-6000/rng_state_1.pth b/sft-lora/checkpoint-6000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1828ae0358bc5852c545eb14cc1f0ba8cb5877a --- /dev/null +++ b/sft-lora/checkpoint-6000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8746d399d43005a6447ab9d40f84e0907616385574832c925bbc169145ea806 +size 18679 diff --git a/sft-lora/checkpoint-6000/rng_state_2.pth b/sft-lora/checkpoint-6000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a100206e289a956c92746593dbf9efe0fc9a657a --- /dev/null +++ b/sft-lora/checkpoint-6000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d416c799ff2ec4a2d6a8e09383202ff1c136b92ab323e2325bc9a0646fc5cfea +size 18679 diff --git a/sft-lora/checkpoint-6000/rng_state_3.pth b/sft-lora/checkpoint-6000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b72fb4b99f89e30566ac3f1140ae5beaaf61a996 --- /dev/null +++ b/sft-lora/checkpoint-6000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f531295e2f7b930d3678382354c0c47ba5cd0e89c32f49834a21b093eebb41f +size 18679 diff --git a/sft-lora/checkpoint-6000/scheduler.pt b/sft-lora/checkpoint-6000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e9d948db035cb0f2e76f4610472c18040b267de --- /dev/null +++ b/sft-lora/checkpoint-6000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b5a2c2f656bea8a2d1ba7a2e6c21bfbd26810ddee16856c79cc08db9957bb27 +size 627 diff --git a/sft-lora/checkpoint-6000/trainer_state.json b/sft-lora/checkpoint-6000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..bff64cec9be63e2cca64def5e506825570038d9b --- /dev/null +++ b/sft-lora/checkpoint-6000/trainer_state.json @@ -0,0 +1,3616 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.6987542468856174, + "global_step": 6000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8524, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.8687, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8505, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8754, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8583, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.8698, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8661, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8574, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.852, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8619, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8632, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8529, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8529, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8465, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8604, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8649, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8572, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8634, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8478, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8475, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8537, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8499, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8467, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8538, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8619, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8593, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8484, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8395, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8547, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8586, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.839, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8417, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8404, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.843, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8557, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8504, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8579, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8563, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.8446, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.8524, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8417, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8582, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.841, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8529, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8545, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8471, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8379, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8542, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8463, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8362, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8467, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8501, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8541, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8443, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8297, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8532, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.854, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.849, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8516, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8394, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8399, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8242, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8395, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8355, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8299, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8272, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8336, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8264, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8381, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8278, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8458, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8348, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.814, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.838, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.824, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.8314, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.821, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8311, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8443, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8315, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8184, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8364, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.8186, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8454, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.832, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8027, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8365, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.8523, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8377, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8299, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8273, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.813, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8262, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8258, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8248, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8123, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8304, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.849, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8255, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8317, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8331, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8309, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8117, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8155, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8178, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8155, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.8273, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8021, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8374, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8173, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8227, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8275, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8226, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.815, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8306, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8424, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8051, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8117, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.8123, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8038, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8308, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8187, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8274, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8171, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8213, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8241, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8296, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8247, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8399, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8015, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.8204, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8198, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8045, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.8185, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8123, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8093, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8194, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8121, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.811, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8013, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8215, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.8079, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.821, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8097, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8046, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8112, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8099, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8148, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8105, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8132, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8149, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8306, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8106, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8192, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8129, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8155, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.8039, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8109, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8063, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8275, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8107, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8047, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8123, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8241, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.812, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8161, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.797, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8155, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.797, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8153, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8016, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8138, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8178, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8062, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8101, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.7982, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8021, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.817, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.8083, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8047, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8063, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8139, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.8075, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.8056, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8242, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.8041, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8088, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8121, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.8151, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8064, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8151, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7942, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8131, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8015, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8053, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.7986, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7936, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8235, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8083, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8081, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.7981, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8152, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.8091, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8206, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7947, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8116, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8135, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8032, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8023, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8116, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8048, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.8032, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.808, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8057, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8013, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.802, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.804, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.7983, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8083, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8203, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.792, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8006, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.7953, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8057, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8005, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8082, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.811, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.7981, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8018, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.7991, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8057, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8156, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8003, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.7976, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7894, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.7953, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8124, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8073, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.7979, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8023, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8046, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.8082, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7868, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.7938, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.8215, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.807, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7878, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.7968, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.787, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.8011, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8086, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8125, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8125, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7805, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.817, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8056, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7752, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7749, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8073, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.8117, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8008, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8028, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.7974, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7867, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8002, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8095, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7847, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7693, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8078, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7925, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.77, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7962, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.8014, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7934, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.7978, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8022, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7934, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.7975, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.807, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7754, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.7977, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7922, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7862, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7918, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.781, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7786, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8067, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7755, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7958, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8064, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.7967, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8107, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7857, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7732, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.7768, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7839, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7923, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.7994, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7907, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7908, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7731, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7769, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.795, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8147, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8065, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7879, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.7755, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7852, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7912, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7934, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.7966, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.7976, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7843, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7848, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7675, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8059, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7871, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.776, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7911, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7934, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7922, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.7931, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7926, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7881, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7842, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7807, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7926, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7878, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7843, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.7748, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.802, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7864, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.7884, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7832, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8039, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.7737, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7844, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7865, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.7983, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7851, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7798, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.79, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7694, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7874, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7878, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.7992, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8003, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7778, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.773, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7872, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.7977, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7792, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7792, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7836, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8005, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7937, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7692, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7926, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7725, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7936, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7776, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7785, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7735, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7925, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7846, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.7782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2696292959503922e-05, + "loss": 0.7888, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2599628708177253e-05, + "loss": 0.7898, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.250320972002072e-05, + "loss": 0.7956, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2407037902076168e-05, + "loss": 0.7735, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.23111151564967e-05, + "loss": 0.7842, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215443380509125e-05, + "loss": 0.7892, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2120024466376381e-05, + "loss": 0.7822, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2024860301360131e-05, + "loss": 0.7788, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1929952767683426e-05, + "loss": 0.7824, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1835303742493508e-05, + "loss": 0.7859, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1740915097824629e-05, + "loss": 0.7897, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.1646788700561085e-05, + "loss": 0.768, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1552926412400225e-05, + "loss": 0.7935, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1459330089815699e-05, + "loss": 0.7933, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.136600158402068e-05, + "loss": 0.7792, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1272942740931286e-05, + "loss": 0.7839, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1180155401130044e-05, + "loss": 0.7844, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.1087641399829527e-05, + "loss": 0.7753, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0995402566835997e-05, + "loss": 0.791, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.090344072651328e-05, + "loss": 0.7998, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0811757697746614e-05, + "loss": 0.7864, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0720355293906741e-05, + "loss": 0.7702, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0629235322813982e-05, + "loss": 0.7705, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0538399586702507e-05, + "loss": 0.7941, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0447849882184715e-05, + "loss": 0.7779, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.035758800021564e-05, + "loss": 0.7755, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0267615726057592e-05, + "loss": 0.7825, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0177934839244787e-05, + "loss": 0.7983, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0088547113548211e-05, + "loss": 0.773, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99945431694048e-06, + "loss": 0.7794, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.910658211560902e-06, + "loss": 0.7889, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.822160553680617e-06, + "loss": 0.7809, + "step": 5000 + }, + { + "epoch": 1.42, + "learning_rate": 9.733963093667889e-06, + "loss": 0.7624, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 9.646067575953419e-06, + "loss": 0.7787, + "step": 5020 + }, + { + "epoch": 1.42, + "learning_rate": 9.558475738995923e-06, + "loss": 0.775, + "step": 5030 + }, + { + "epoch": 1.43, + "learning_rate": 9.471189315247669e-06, + "loss": 0.7607, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 9.384210031120288e-06, + "loss": 0.7795, + "step": 5050 + }, + { + "epoch": 1.43, + "learning_rate": 9.297539606950564e-06, + "loss": 0.7933, + "step": 5060 + }, + { + "epoch": 1.44, + "learning_rate": 9.21117975696644e-06, + "loss": 0.7859, + "step": 5070 + }, + { + "epoch": 1.44, + "learning_rate": 9.1251321892531e-06, + "loss": 0.7772, + "step": 5080 + }, + { + "epoch": 1.44, + "learning_rate": 9.039398605719215e-06, + "loss": 0.7833, + "step": 5090 + }, + { + "epoch": 1.44, + "learning_rate": 8.953980702063233e-06, + "loss": 0.7784, + "step": 5100 + }, + { + "epoch": 1.45, + "learning_rate": 8.868880167739887e-06, + "loss": 0.7835, + "step": 5110 + }, + { + "epoch": 1.45, + "learning_rate": 8.784098685926734e-06, + "loss": 0.779, + "step": 5120 + }, + { + "epoch": 1.45, + "learning_rate": 8.699637933490917e-06, + "loss": 0.7953, + "step": 5130 + }, + { + "epoch": 1.46, + "learning_rate": 8.615499580955953e-06, + "loss": 0.773, + "step": 5140 + }, + { + "epoch": 1.46, + "learning_rate": 8.531685292468693e-06, + "loss": 0.7851, + "step": 5150 + }, + { + "epoch": 1.46, + "learning_rate": 8.448196725766471e-06, + "loss": 0.7903, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 8.365035532144217e-06, + "loss": 0.7822, + "step": 5170 + }, + { + "epoch": 1.47, + "learning_rate": 8.282203356421891e-06, + "loss": 0.7887, + "step": 5180 + }, + { + "epoch": 1.47, + "learning_rate": 8.199701836911877e-06, + "loss": 0.7972, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 8.117532605386632e-06, + "loss": 0.7781, + "step": 5200 + }, + { + "epoch": 1.48, + "learning_rate": 8.035697287046376e-06, + "loss": 0.7885, + "step": 5210 + }, + { + "epoch": 1.48, + "learning_rate": 7.954197500486968e-06, + "loss": 0.779, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 7.873034857667877e-06, + "loss": 0.779, + "step": 5230 + }, + { + "epoch": 1.48, + "learning_rate": 7.792210963880328e-06, + "loss": 0.7883, + "step": 5240 + }, + { + "epoch": 1.49, + "learning_rate": 7.711727417715509e-06, + "loss": 0.7677, + "step": 5250 + }, + { + "epoch": 1.49, + "learning_rate": 7.631585811032999e-06, + "loss": 0.7849, + "step": 5260 + }, + { + "epoch": 1.49, + "learning_rate": 7.551787728929236e-06, + "loss": 0.7707, + "step": 5270 + }, + { + "epoch": 1.49, + "learning_rate": 7.472334749706214e-06, + "loss": 0.7855, + "step": 5280 + }, + { + "epoch": 1.5, + "learning_rate": 7.393228444840228e-06, + "loss": 0.7601, + "step": 5290 + }, + { + "epoch": 1.5, + "learning_rate": 7.314470378950802e-06, + "loss": 0.7741, + "step": 5300 + }, + { + "epoch": 1.5, + "learning_rate": 7.23606210976975e-06, + "loss": 0.7733, + "step": 5310 + }, + { + "epoch": 1.51, + "learning_rate": 7.158005188110381e-06, + "loss": 0.7881, + "step": 5320 + }, + { + "epoch": 1.51, + "learning_rate": 7.080301157836783e-06, + "loss": 0.7761, + "step": 5330 + }, + { + "epoch": 1.51, + "learning_rate": 7.002951555833334e-06, + "loss": 0.7692, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 6.925957911974262e-06, + "loss": 0.7656, + "step": 5350 + }, + { + "epoch": 1.52, + "learning_rate": 6.849321749093432e-06, + "loss": 0.7754, + "step": 5360 + }, + { + "epoch": 1.52, + "learning_rate": 6.773044582954172e-06, + "loss": 0.7828, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 6.697127922219357e-06, + "loss": 0.779, + "step": 5380 + }, + { + "epoch": 1.53, + "learning_rate": 6.621573268421505e-06, + "loss": 0.7856, + "step": 5390 + }, + { + "epoch": 1.53, + "learning_rate": 6.546382115933117e-06, + "loss": 0.7908, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 6.47155595193713e-06, + "loss": 0.7899, + "step": 5410 + }, + { + "epoch": 1.53, + "learning_rate": 6.397096256397456e-06, + "loss": 0.7736, + "step": 5420 + }, + { + "epoch": 1.54, + "learning_rate": 6.323004502029767e-06, + "loss": 0.7788, + "step": 5430 + }, + { + "epoch": 1.54, + "learning_rate": 6.249282154272315e-06, + "loss": 0.7729, + "step": 5440 + }, + { + "epoch": 1.54, + "learning_rate": 6.175930671256991e-06, + "loss": 0.7706, + "step": 5450 + }, + { + "epoch": 1.55, + "learning_rate": 6.102951503780449e-06, + "loss": 0.7915, + "step": 5460 + }, + { + "epoch": 1.55, + "learning_rate": 6.030346095275438e-06, + "loss": 0.7893, + "step": 5470 + }, + { + "epoch": 1.55, + "learning_rate": 5.958115881782228e-06, + "loss": 0.7813, + "step": 5480 + }, + { + "epoch": 1.55, + "learning_rate": 5.886262291920244e-06, + "loss": 0.793, + "step": 5490 + }, + { + "epoch": 1.56, + "learning_rate": 5.81478674685976e-06, + "loss": 0.7801, + "step": 5500 + }, + { + "epoch": 1.56, + "learning_rate": 5.7436906602938435e-06, + "loss": 0.7878, + "step": 5510 + }, + { + "epoch": 1.56, + "learning_rate": 5.672975438410344e-06, + "loss": 0.7762, + "step": 5520 + }, + { + "epoch": 1.57, + "learning_rate": 5.602642479864129e-06, + "loss": 0.7775, + "step": 5530 + }, + { + "epoch": 1.57, + "learning_rate": 5.532693175749373e-06, + "loss": 0.7689, + "step": 5540 + }, + { + "epoch": 1.57, + "learning_rate": 5.463128909572077e-06, + "loss": 0.7755, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 5.393951057222685e-06, + "loss": 0.7878, + "step": 5560 + }, + { + "epoch": 1.58, + "learning_rate": 5.325160986948899e-06, + "loss": 0.7759, + "step": 5570 + }, + { + "epoch": 1.58, + "learning_rate": 5.256760059328572e-06, + "loss": 0.7698, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 5.188749627242851e-06, + "loss": 0.7853, + "step": 5590 + }, + { + "epoch": 1.59, + "learning_rate": 5.121131035849361e-06, + "loss": 0.7886, + "step": 5600 + }, + { + "epoch": 1.59, + "learning_rate": 5.053905622555657e-06, + "loss": 0.7869, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 4.987074716992724e-06, + "loss": 0.7882, + "step": 5620 + }, + { + "epoch": 1.59, + "learning_rate": 4.920639640988697e-06, + "loss": 0.7854, + "step": 5630 + }, + { + "epoch": 1.6, + "learning_rate": 4.854601708542747e-06, + "loss": 0.7807, + "step": 5640 + }, + { + "epoch": 1.6, + "learning_rate": 4.7889622257990205e-06, + "loss": 0.7819, + "step": 5650 + }, + { + "epoch": 1.6, + "learning_rate": 4.7237224910208935e-06, + "loss": 0.7755, + "step": 5660 + }, + { + "epoch": 1.61, + "learning_rate": 4.658883794565208e-06, + "loss": 0.7829, + "step": 5670 + }, + { + "epoch": 1.61, + "learning_rate": 4.594447418856823e-06, + "loss": 0.7761, + "step": 5680 + }, + { + "epoch": 1.61, + "learning_rate": 4.530414638363201e-06, + "loss": 0.7742, + "step": 5690 + }, + { + "epoch": 1.61, + "learning_rate": 4.466786719569221e-06, + "loss": 0.7744, + "step": 5700 + }, + { + "epoch": 1.62, + "learning_rate": 4.403564920952116e-06, + "loss": 0.78, + "step": 5710 + }, + { + "epoch": 1.62, + "learning_rate": 4.3407504929566166e-06, + "loss": 0.7847, + "step": 5720 + }, + { + "epoch": 1.62, + "learning_rate": 4.278344677970167e-06, + "loss": 0.7837, + "step": 5730 + }, + { + "epoch": 1.63, + "learning_rate": 4.216348710298401e-06, + "loss": 0.774, + "step": 5740 + }, + { + "epoch": 1.63, + "learning_rate": 4.154763816140686e-06, + "loss": 0.7826, + "step": 5750 + }, + { + "epoch": 1.63, + "learning_rate": 4.093591213565914e-06, + "loss": 0.7881, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 4.032832112488369e-06, + "loss": 0.7878, + "step": 5770 + }, + { + "epoch": 1.64, + "learning_rate": 3.972487714643822e-06, + "loss": 0.7722, + "step": 5780 + }, + { + "epoch": 1.64, + "learning_rate": 3.9125592135657475e-06, + "loss": 0.7689, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.853047794561743e-06, + "loss": 0.788, + "step": 5800 + }, + { + "epoch": 1.64, + "learning_rate": 3.7939546346900417e-06, + "loss": 0.7705, + "step": 5810 + }, + { + "epoch": 1.65, + "learning_rate": 3.7352809027362796e-06, + "loss": 0.7591, + "step": 5820 + }, + { + "epoch": 1.65, + "learning_rate": 3.6770277591903462e-06, + "loss": 0.7587, + "step": 5830 + }, + { + "epoch": 1.65, + "learning_rate": 3.619196356223439e-06, + "loss": 0.7782, + "step": 5840 + }, + { + "epoch": 1.66, + "learning_rate": 3.5617878376652785e-06, + "loss": 0.7811, + "step": 5850 + }, + { + "epoch": 1.66, + "learning_rate": 3.504803338981472e-06, + "loss": 0.786, + "step": 5860 + }, + { + "epoch": 1.66, + "learning_rate": 3.448243987251093e-06, + "loss": 0.7911, + "step": 5870 + }, + { + "epoch": 1.66, + "learning_rate": 3.3921109011443354e-06, + "loss": 0.7706, + "step": 5880 + }, + { + "epoch": 1.67, + "learning_rate": 3.336405190900438e-06, + "loss": 0.7913, + "step": 5890 + }, + { + "epoch": 1.67, + "learning_rate": 3.2811279583056825e-06, + "loss": 0.7849, + "step": 5900 + }, + { + "epoch": 1.67, + "learning_rate": 3.2262802966716383e-06, + "loss": 0.7759, + "step": 5910 + }, + { + "epoch": 1.68, + "learning_rate": 3.171863290813509e-06, + "loss": 0.8093, + "step": 5920 + }, + { + "epoch": 1.68, + "learning_rate": 3.117878017028697e-06, + "loss": 0.7634, + "step": 5930 + }, + { + "epoch": 1.68, + "learning_rate": 3.064325543075494e-06, + "loss": 0.777, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.0112069281519994e-06, + "loss": 0.7794, + "step": 5950 + }, + { + "epoch": 1.69, + "learning_rate": 2.9585232228751204e-06, + "loss": 0.7703, + "step": 5960 + }, + { + "epoch": 1.69, + "learning_rate": 2.906275469259839e-06, + "loss": 0.7725, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 2.8544647006985724e-06, + "loss": 0.7913, + "step": 5980 + }, + { + "epoch": 1.7, + "learning_rate": 2.803091941940747e-06, + "loss": 0.7897, + "step": 5990 + }, + { + "epoch": 1.7, + "learning_rate": 2.752158209072522e-06, + "loss": 0.7785, + "step": 6000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 2.125203330991076e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/checkpoint-6000/training_args.bin b/sft-lora/checkpoint-6000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/checkpoint-6000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/checkpoint-7000/README.md b/sft-lora/checkpoint-7000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-lora/checkpoint-7000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-lora/checkpoint-7000/adapter_config.json b/sft-lora/checkpoint-7000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-lora/checkpoint-7000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-lora/checkpoint-7000/adapter_model.bin b/sft-lora/checkpoint-7000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..bfd86b21272e2f6a6d50441242efa8e596cba4a9 --- /dev/null +++ b/sft-lora/checkpoint-7000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f6ec1cb56239dd8f3963a99654003f7d82435bcac4ee49ec070d92c26cb3c08 +size 26269517 diff --git a/sft-lora/checkpoint-7000/finetuning_args.json b/sft-lora/checkpoint-7000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/checkpoint-7000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/checkpoint-7000/optimizer.pt b/sft-lora/checkpoint-7000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6f228392ffee78389d6906d61923efc7bb78527 --- /dev/null +++ b/sft-lora/checkpoint-7000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f7fd9b328ff6dcfda054d873d91e6ff96dbac45b0c36fb4011653c0c0d11d8 +size 52562821 diff --git a/sft-lora/checkpoint-7000/rng_state_0.pth b/sft-lora/checkpoint-7000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..14de24f9400648b183a1a87d4dba0e3f1442902c --- /dev/null +++ b/sft-lora/checkpoint-7000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41674ee63543d3cd494c5e56b71bf7975ef6eb1a4203ce26ea6a75d229a6459 +size 18679 diff --git a/sft-lora/checkpoint-7000/rng_state_1.pth b/sft-lora/checkpoint-7000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c5a3d730073587b4388351a6071e2b78385e036 --- /dev/null +++ b/sft-lora/checkpoint-7000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef29132d00d7863f67201df64e6651ada06b7a507c18d22f83d1e0c2cb066dc8 +size 18679 diff --git a/sft-lora/checkpoint-7000/rng_state_2.pth b/sft-lora/checkpoint-7000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..edaa68baac6eb7ac90e06e296c143671a2b426c2 --- /dev/null +++ b/sft-lora/checkpoint-7000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5df393134b32648186b44272488442b8b7df7807c197b01a520072901355d41 +size 18679 diff --git a/sft-lora/checkpoint-7000/rng_state_3.pth b/sft-lora/checkpoint-7000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..f2fa2e74ac9f940a3b48fc524c38c346377e88f3 --- /dev/null +++ b/sft-lora/checkpoint-7000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e30d7da079ef2454837d1b8adb93645add57666813a8c7589577abd4d21e21 +size 18679 diff --git a/sft-lora/checkpoint-7000/scheduler.pt b/sft-lora/checkpoint-7000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4328d4843aba209737d3fac94c038527b2553a5 --- /dev/null +++ b/sft-lora/checkpoint-7000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c118750b74d5b8fff99b8e7a67475a28dfc9543b920285fa34d7d14c00e052f +size 627 diff --git a/sft-lora/checkpoint-7000/trainer_state.json b/sft-lora/checkpoint-7000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2bd248b727d1d488c38222cee83fb5de95bb26fe --- /dev/null +++ b/sft-lora/checkpoint-7000/trainer_state.json @@ -0,0 +1,4216 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.9818799546998869, + "global_step": 7000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8524, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.8687, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8505, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8754, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8583, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.8698, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8661, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8574, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.852, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8619, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8632, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8529, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8529, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8465, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8604, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8649, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8572, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8634, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8478, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8475, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8537, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8499, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8467, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8538, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8619, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8593, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8484, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8395, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8547, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8586, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.839, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8417, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8404, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.843, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8557, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8504, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8579, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8563, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.8446, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.8524, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8417, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8582, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.841, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8529, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8545, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8471, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8379, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8542, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8463, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8362, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8467, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8501, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8541, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8443, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8297, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8532, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.854, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.849, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8516, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8394, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8399, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8242, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8395, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8355, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8299, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8272, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8336, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8264, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8381, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8278, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8458, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8348, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.814, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.838, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.824, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.8314, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.821, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8311, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8443, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8315, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8184, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8364, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.8186, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8454, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.832, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8027, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8365, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.8523, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8377, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8299, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8273, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.813, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8262, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8258, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8248, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8123, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8304, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.849, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8255, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8317, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8331, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8309, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8117, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8155, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8178, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8155, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.8273, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8021, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8374, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8173, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8227, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8275, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8226, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.815, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8306, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8424, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8051, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8117, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.8123, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8038, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8308, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8187, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8274, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8171, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8213, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8241, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8296, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8247, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8399, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8015, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.8204, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8198, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8045, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.8185, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8123, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8093, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8194, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8121, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.811, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8013, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8215, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.8079, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.821, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8097, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8046, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8112, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8099, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8148, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8105, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8132, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8149, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8306, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8106, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8192, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8129, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8155, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.8039, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8109, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8063, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8275, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8107, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8047, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8123, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8241, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.812, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8161, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.797, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8155, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.797, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8153, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8016, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8138, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8178, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8062, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8101, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.7982, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8021, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.817, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.8083, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8047, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8063, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8139, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.8075, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.8056, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8242, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.8041, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8088, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8121, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.8151, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8064, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8151, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7942, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8131, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8015, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8053, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.7986, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7936, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8235, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8083, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8081, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.7981, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8152, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.8091, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8206, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7947, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8116, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8135, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8032, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8023, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8116, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8048, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.8032, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.808, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8057, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8013, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.802, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.804, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.7983, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8083, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8203, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.792, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8006, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.7953, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8057, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8005, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8082, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.811, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.7981, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8018, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.7991, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8057, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8156, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8003, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.7976, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7894, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.7953, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8124, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8073, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.7979, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8023, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8046, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.8082, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7868, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.7938, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.8215, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.807, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7878, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.7968, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.787, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.8011, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8086, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8125, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8125, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7805, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.817, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8056, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7752, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7749, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8073, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.8117, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8008, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8028, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.7974, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7867, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8002, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8095, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7847, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7693, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8078, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7925, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.77, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7962, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.8014, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7934, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.7978, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8022, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7934, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.7975, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.807, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7754, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.7977, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7922, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7862, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7918, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.781, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7786, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8067, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7755, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7958, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8064, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.7967, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8107, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7857, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7732, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.7768, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7839, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7923, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.7994, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7907, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7908, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7731, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7769, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.795, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8147, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8065, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7879, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.7755, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7852, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7912, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7934, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.7966, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.7976, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7843, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7848, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7675, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8059, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7871, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.776, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7911, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7934, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7922, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.7931, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7926, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7881, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7842, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7807, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7926, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7878, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7843, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.7748, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.802, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7864, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.7884, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7832, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8039, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.7737, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7844, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7865, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.7983, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7851, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7798, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.79, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7694, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7874, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7878, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.7992, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8003, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7778, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.773, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7872, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.7977, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7792, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7792, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7836, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8005, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7937, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7692, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7926, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7725, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7936, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7776, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7785, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7735, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7925, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7846, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.7782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2696292959503922e-05, + "loss": 0.7888, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2599628708177253e-05, + "loss": 0.7898, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.250320972002072e-05, + "loss": 0.7956, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2407037902076168e-05, + "loss": 0.7735, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.23111151564967e-05, + "loss": 0.7842, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215443380509125e-05, + "loss": 0.7892, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2120024466376381e-05, + "loss": 0.7822, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2024860301360131e-05, + "loss": 0.7788, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1929952767683426e-05, + "loss": 0.7824, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1835303742493508e-05, + "loss": 0.7859, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1740915097824629e-05, + "loss": 0.7897, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.1646788700561085e-05, + "loss": 0.768, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1552926412400225e-05, + "loss": 0.7935, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1459330089815699e-05, + "loss": 0.7933, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.136600158402068e-05, + "loss": 0.7792, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1272942740931286e-05, + "loss": 0.7839, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1180155401130044e-05, + "loss": 0.7844, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.1087641399829527e-05, + "loss": 0.7753, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0995402566835997e-05, + "loss": 0.791, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.090344072651328e-05, + "loss": 0.7998, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0811757697746614e-05, + "loss": 0.7864, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0720355293906741e-05, + "loss": 0.7702, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0629235322813982e-05, + "loss": 0.7705, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0538399586702507e-05, + "loss": 0.7941, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0447849882184715e-05, + "loss": 0.7779, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.035758800021564e-05, + "loss": 0.7755, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0267615726057592e-05, + "loss": 0.7825, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0177934839244787e-05, + "loss": 0.7983, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0088547113548211e-05, + "loss": 0.773, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99945431694048e-06, + "loss": 0.7794, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.910658211560902e-06, + "loss": 0.7889, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.822160553680617e-06, + "loss": 0.7809, + "step": 5000 + }, + { + "epoch": 1.42, + "learning_rate": 9.733963093667889e-06, + "loss": 0.7624, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 9.646067575953419e-06, + "loss": 0.7787, + "step": 5020 + }, + { + "epoch": 1.42, + "learning_rate": 9.558475738995923e-06, + "loss": 0.775, + "step": 5030 + }, + { + "epoch": 1.43, + "learning_rate": 9.471189315247669e-06, + "loss": 0.7607, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 9.384210031120288e-06, + "loss": 0.7795, + "step": 5050 + }, + { + "epoch": 1.43, + "learning_rate": 9.297539606950564e-06, + "loss": 0.7933, + "step": 5060 + }, + { + "epoch": 1.44, + "learning_rate": 9.21117975696644e-06, + "loss": 0.7859, + "step": 5070 + }, + { + "epoch": 1.44, + "learning_rate": 9.1251321892531e-06, + "loss": 0.7772, + "step": 5080 + }, + { + "epoch": 1.44, + "learning_rate": 9.039398605719215e-06, + "loss": 0.7833, + "step": 5090 + }, + { + "epoch": 1.44, + "learning_rate": 8.953980702063233e-06, + "loss": 0.7784, + "step": 5100 + }, + { + "epoch": 1.45, + "learning_rate": 8.868880167739887e-06, + "loss": 0.7835, + "step": 5110 + }, + { + "epoch": 1.45, + "learning_rate": 8.784098685926734e-06, + "loss": 0.779, + "step": 5120 + }, + { + "epoch": 1.45, + "learning_rate": 8.699637933490917e-06, + "loss": 0.7953, + "step": 5130 + }, + { + "epoch": 1.46, + "learning_rate": 8.615499580955953e-06, + "loss": 0.773, + "step": 5140 + }, + { + "epoch": 1.46, + "learning_rate": 8.531685292468693e-06, + "loss": 0.7851, + "step": 5150 + }, + { + "epoch": 1.46, + "learning_rate": 8.448196725766471e-06, + "loss": 0.7903, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 8.365035532144217e-06, + "loss": 0.7822, + "step": 5170 + }, + { + "epoch": 1.47, + "learning_rate": 8.282203356421891e-06, + "loss": 0.7887, + "step": 5180 + }, + { + "epoch": 1.47, + "learning_rate": 8.199701836911877e-06, + "loss": 0.7972, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 8.117532605386632e-06, + "loss": 0.7781, + "step": 5200 + }, + { + "epoch": 1.48, + "learning_rate": 8.035697287046376e-06, + "loss": 0.7885, + "step": 5210 + }, + { + "epoch": 1.48, + "learning_rate": 7.954197500486968e-06, + "loss": 0.779, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 7.873034857667877e-06, + "loss": 0.779, + "step": 5230 + }, + { + "epoch": 1.48, + "learning_rate": 7.792210963880328e-06, + "loss": 0.7883, + "step": 5240 + }, + { + "epoch": 1.49, + "learning_rate": 7.711727417715509e-06, + "loss": 0.7677, + "step": 5250 + }, + { + "epoch": 1.49, + "learning_rate": 7.631585811032999e-06, + "loss": 0.7849, + "step": 5260 + }, + { + "epoch": 1.49, + "learning_rate": 7.551787728929236e-06, + "loss": 0.7707, + "step": 5270 + }, + { + "epoch": 1.49, + "learning_rate": 7.472334749706214e-06, + "loss": 0.7855, + "step": 5280 + }, + { + "epoch": 1.5, + "learning_rate": 7.393228444840228e-06, + "loss": 0.7601, + "step": 5290 + }, + { + "epoch": 1.5, + "learning_rate": 7.314470378950802e-06, + "loss": 0.7741, + "step": 5300 + }, + { + "epoch": 1.5, + "learning_rate": 7.23606210976975e-06, + "loss": 0.7733, + "step": 5310 + }, + { + "epoch": 1.51, + "learning_rate": 7.158005188110381e-06, + "loss": 0.7881, + "step": 5320 + }, + { + "epoch": 1.51, + "learning_rate": 7.080301157836783e-06, + "loss": 0.7761, + "step": 5330 + }, + { + "epoch": 1.51, + "learning_rate": 7.002951555833334e-06, + "loss": 0.7692, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 6.925957911974262e-06, + "loss": 0.7656, + "step": 5350 + }, + { + "epoch": 1.52, + "learning_rate": 6.849321749093432e-06, + "loss": 0.7754, + "step": 5360 + }, + { + "epoch": 1.52, + "learning_rate": 6.773044582954172e-06, + "loss": 0.7828, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 6.697127922219357e-06, + "loss": 0.779, + "step": 5380 + }, + { + "epoch": 1.53, + "learning_rate": 6.621573268421505e-06, + "loss": 0.7856, + "step": 5390 + }, + { + "epoch": 1.53, + "learning_rate": 6.546382115933117e-06, + "loss": 0.7908, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 6.47155595193713e-06, + "loss": 0.7899, + "step": 5410 + }, + { + "epoch": 1.53, + "learning_rate": 6.397096256397456e-06, + "loss": 0.7736, + "step": 5420 + }, + { + "epoch": 1.54, + "learning_rate": 6.323004502029767e-06, + "loss": 0.7788, + "step": 5430 + }, + { + "epoch": 1.54, + "learning_rate": 6.249282154272315e-06, + "loss": 0.7729, + "step": 5440 + }, + { + "epoch": 1.54, + "learning_rate": 6.175930671256991e-06, + "loss": 0.7706, + "step": 5450 + }, + { + "epoch": 1.55, + "learning_rate": 6.102951503780449e-06, + "loss": 0.7915, + "step": 5460 + }, + { + "epoch": 1.55, + "learning_rate": 6.030346095275438e-06, + "loss": 0.7893, + "step": 5470 + }, + { + "epoch": 1.55, + "learning_rate": 5.958115881782228e-06, + "loss": 0.7813, + "step": 5480 + }, + { + "epoch": 1.55, + "learning_rate": 5.886262291920244e-06, + "loss": 0.793, + "step": 5490 + }, + { + "epoch": 1.56, + "learning_rate": 5.81478674685976e-06, + "loss": 0.7801, + "step": 5500 + }, + { + "epoch": 1.56, + "learning_rate": 5.7436906602938435e-06, + "loss": 0.7878, + "step": 5510 + }, + { + "epoch": 1.56, + "learning_rate": 5.672975438410344e-06, + "loss": 0.7762, + "step": 5520 + }, + { + "epoch": 1.57, + "learning_rate": 5.602642479864129e-06, + "loss": 0.7775, + "step": 5530 + }, + { + "epoch": 1.57, + "learning_rate": 5.532693175749373e-06, + "loss": 0.7689, + "step": 5540 + }, + { + "epoch": 1.57, + "learning_rate": 5.463128909572077e-06, + "loss": 0.7755, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 5.393951057222685e-06, + "loss": 0.7878, + "step": 5560 + }, + { + "epoch": 1.58, + "learning_rate": 5.325160986948899e-06, + "loss": 0.7759, + "step": 5570 + }, + { + "epoch": 1.58, + "learning_rate": 5.256760059328572e-06, + "loss": 0.7698, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 5.188749627242851e-06, + "loss": 0.7853, + "step": 5590 + }, + { + "epoch": 1.59, + "learning_rate": 5.121131035849361e-06, + "loss": 0.7886, + "step": 5600 + }, + { + "epoch": 1.59, + "learning_rate": 5.053905622555657e-06, + "loss": 0.7869, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 4.987074716992724e-06, + "loss": 0.7882, + "step": 5620 + }, + { + "epoch": 1.59, + "learning_rate": 4.920639640988697e-06, + "loss": 0.7854, + "step": 5630 + }, + { + "epoch": 1.6, + "learning_rate": 4.854601708542747e-06, + "loss": 0.7807, + "step": 5640 + }, + { + "epoch": 1.6, + "learning_rate": 4.7889622257990205e-06, + "loss": 0.7819, + "step": 5650 + }, + { + "epoch": 1.6, + "learning_rate": 4.7237224910208935e-06, + "loss": 0.7755, + "step": 5660 + }, + { + "epoch": 1.61, + "learning_rate": 4.658883794565208e-06, + "loss": 0.7829, + "step": 5670 + }, + { + "epoch": 1.61, + "learning_rate": 4.594447418856823e-06, + "loss": 0.7761, + "step": 5680 + }, + { + "epoch": 1.61, + "learning_rate": 4.530414638363201e-06, + "loss": 0.7742, + "step": 5690 + }, + { + "epoch": 1.61, + "learning_rate": 4.466786719569221e-06, + "loss": 0.7744, + "step": 5700 + }, + { + "epoch": 1.62, + "learning_rate": 4.403564920952116e-06, + "loss": 0.78, + "step": 5710 + }, + { + "epoch": 1.62, + "learning_rate": 4.3407504929566166e-06, + "loss": 0.7847, + "step": 5720 + }, + { + "epoch": 1.62, + "learning_rate": 4.278344677970167e-06, + "loss": 0.7837, + "step": 5730 + }, + { + "epoch": 1.63, + "learning_rate": 4.216348710298401e-06, + "loss": 0.774, + "step": 5740 + }, + { + "epoch": 1.63, + "learning_rate": 4.154763816140686e-06, + "loss": 0.7826, + "step": 5750 + }, + { + "epoch": 1.63, + "learning_rate": 4.093591213565914e-06, + "loss": 0.7881, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 4.032832112488369e-06, + "loss": 0.7878, + "step": 5770 + }, + { + "epoch": 1.64, + "learning_rate": 3.972487714643822e-06, + "loss": 0.7722, + "step": 5780 + }, + { + "epoch": 1.64, + "learning_rate": 3.9125592135657475e-06, + "loss": 0.7689, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.853047794561743e-06, + "loss": 0.788, + "step": 5800 + }, + { + "epoch": 1.64, + "learning_rate": 3.7939546346900417e-06, + "loss": 0.7705, + "step": 5810 + }, + { + "epoch": 1.65, + "learning_rate": 3.7352809027362796e-06, + "loss": 0.7591, + "step": 5820 + }, + { + "epoch": 1.65, + "learning_rate": 3.6770277591903462e-06, + "loss": 0.7587, + "step": 5830 + }, + { + "epoch": 1.65, + "learning_rate": 3.619196356223439e-06, + "loss": 0.7782, + "step": 5840 + }, + { + "epoch": 1.66, + "learning_rate": 3.5617878376652785e-06, + "loss": 0.7811, + "step": 5850 + }, + { + "epoch": 1.66, + "learning_rate": 3.504803338981472e-06, + "loss": 0.786, + "step": 5860 + }, + { + "epoch": 1.66, + "learning_rate": 3.448243987251093e-06, + "loss": 0.7911, + "step": 5870 + }, + { + "epoch": 1.66, + "learning_rate": 3.3921109011443354e-06, + "loss": 0.7706, + "step": 5880 + }, + { + "epoch": 1.67, + "learning_rate": 3.336405190900438e-06, + "loss": 0.7913, + "step": 5890 + }, + { + "epoch": 1.67, + "learning_rate": 3.2811279583056825e-06, + "loss": 0.7849, + "step": 5900 + }, + { + "epoch": 1.67, + "learning_rate": 3.2262802966716383e-06, + "loss": 0.7759, + "step": 5910 + }, + { + "epoch": 1.68, + "learning_rate": 3.171863290813509e-06, + "loss": 0.8093, + "step": 5920 + }, + { + "epoch": 1.68, + "learning_rate": 3.117878017028697e-06, + "loss": 0.7634, + "step": 5930 + }, + { + "epoch": 1.68, + "learning_rate": 3.064325543075494e-06, + "loss": 0.777, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.0112069281519994e-06, + "loss": 0.7794, + "step": 5950 + }, + { + "epoch": 1.69, + "learning_rate": 2.9585232228751204e-06, + "loss": 0.7703, + "step": 5960 + }, + { + "epoch": 1.69, + "learning_rate": 2.906275469259839e-06, + "loss": 0.7725, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 2.8544647006985724e-06, + "loss": 0.7913, + "step": 5980 + }, + { + "epoch": 1.7, + "learning_rate": 2.803091941940747e-06, + "loss": 0.7897, + "step": 5990 + }, + { + "epoch": 1.7, + "learning_rate": 2.752158209072522e-06, + "loss": 0.7785, + "step": 6000 + }, + { + "epoch": 1.7, + "learning_rate": 2.701664509496701e-06, + "loss": 0.7742, + "step": 6010 + }, + { + "epoch": 1.7, + "learning_rate": 2.651611841912796e-06, + "loss": 0.7742, + "step": 6020 + }, + { + "epoch": 1.71, + "learning_rate": 2.602001196297299e-06, + "loss": 0.7947, + "step": 6030 + }, + { + "epoch": 1.71, + "learning_rate": 2.5528335538840597e-06, + "loss": 0.7842, + "step": 6040 + }, + { + "epoch": 1.71, + "learning_rate": 2.5041098871449204e-06, + "loss": 0.7738, + "step": 6050 + }, + { + "epoch": 1.72, + "learning_rate": 2.4558311597704636e-06, + "loss": 0.778, + "step": 6060 + }, + { + "epoch": 1.72, + "learning_rate": 2.40799832665094e-06, + "loss": 0.772, + "step": 6070 + }, + { + "epoch": 1.72, + "learning_rate": 2.360612333857401e-06, + "loss": 0.7742, + "step": 6080 + }, + { + "epoch": 1.72, + "learning_rate": 2.31367411862298e-06, + "loss": 0.7846, + "step": 6090 + }, + { + "epoch": 1.73, + "learning_rate": 2.2671846093243493e-06, + "loss": 0.785, + "step": 6100 + }, + { + "epoch": 1.73, + "learning_rate": 2.221144725463359e-06, + "loss": 0.7846, + "step": 6110 + }, + { + "epoch": 1.73, + "learning_rate": 2.1755553776488745e-06, + "loss": 0.797, + "step": 6120 + }, + { + "epoch": 1.74, + "learning_rate": 2.130417467578724e-06, + "loss": 0.7936, + "step": 6130 + }, + { + "epoch": 1.74, + "learning_rate": 2.0857318880218995e-06, + "loss": 0.7785, + "step": 6140 + }, + { + "epoch": 1.74, + "learning_rate": 2.0414995228008743e-06, + "loss": 0.7619, + "step": 6150 + }, + { + "epoch": 1.74, + "learning_rate": 1.997721246774145e-06, + "loss": 0.7624, + "step": 6160 + }, + { + "epoch": 1.75, + "learning_rate": 1.9543979258189126e-06, + "loss": 0.7682, + "step": 6170 + }, + { + "epoch": 1.75, + "learning_rate": 1.911530416813953e-06, + "loss": 0.7834, + "step": 6180 + }, + { + "epoch": 1.75, + "learning_rate": 1.869119567622679e-06, + "loss": 0.7947, + "step": 6190 + }, + { + "epoch": 1.76, + "learning_rate": 1.8271662170763787e-06, + "loss": 0.8014, + "step": 6200 + }, + { + "epoch": 1.76, + "learning_rate": 1.7856711949575972e-06, + "loss": 0.7769, + "step": 6210 + }, + { + "epoch": 1.76, + "learning_rate": 1.7446353219837592e-06, + "loss": 0.7804, + "step": 6220 + }, + { + "epoch": 1.76, + "learning_rate": 1.704059409790898e-06, + "loss": 0.787, + "step": 6230 + }, + { + "epoch": 1.77, + "learning_rate": 1.6639442609176409e-06, + "loss": 0.7745, + "step": 6240 + }, + { + "epoch": 1.77, + "learning_rate": 1.6242906687893077e-06, + "loss": 0.7888, + "step": 6250 + }, + { + "epoch": 1.77, + "learning_rate": 1.5850994177022265e-06, + "loss": 0.7949, + "step": 6260 + }, + { + "epoch": 1.78, + "learning_rate": 1.546371282808226e-06, + "loss": 0.7702, + "step": 6270 + }, + { + "epoch": 1.78, + "learning_rate": 1.508107030099304e-06, + "loss": 0.7911, + "step": 6280 + }, + { + "epoch": 1.78, + "learning_rate": 1.4703074163924718e-06, + "loss": 0.7807, + "step": 6290 + }, + { + "epoch": 1.78, + "learning_rate": 1.4329731893147792e-06, + "loss": 0.7797, + "step": 6300 + }, + { + "epoch": 1.79, + "learning_rate": 1.396105087288549e-06, + "loss": 0.7899, + "step": 6310 + }, + { + "epoch": 1.79, + "learning_rate": 1.3597038395167516e-06, + "loss": 0.7755, + "step": 6320 + }, + { + "epoch": 1.79, + "learning_rate": 1.3237701659685854e-06, + "loss": 0.7765, + "step": 6330 + }, + { + "epoch": 1.8, + "learning_rate": 1.28830477736524e-06, + "loss": 0.7679, + "step": 6340 + }, + { + "epoch": 1.8, + "learning_rate": 1.253308375165857e-06, + "loss": 0.7881, + "step": 6350 + }, + { + "epoch": 1.8, + "learning_rate": 1.2187816515536105e-06, + "loss": 0.78, + "step": 6360 + }, + { + "epoch": 1.8, + "learning_rate": 1.184725289422073e-06, + "loss": 0.7893, + "step": 6370 + }, + { + "epoch": 1.81, + "learning_rate": 1.151139962361658e-06, + "loss": 0.7799, + "step": 6380 + }, + { + "epoch": 1.81, + "learning_rate": 1.1180263346463327e-06, + "loss": 0.7734, + "step": 6390 + }, + { + "epoch": 1.81, + "learning_rate": 1.0853850612204646e-06, + "loss": 0.7719, + "step": 6400 + }, + { + "epoch": 1.81, + "learning_rate": 1.053216787685865e-06, + "loss": 0.7752, + "step": 6410 + }, + { + "epoch": 1.82, + "learning_rate": 1.0215221502890254e-06, + "loss": 0.7758, + "step": 6420 + }, + { + "epoch": 1.82, + "learning_rate": 9.903017759085365e-07, + "loss": 0.7696, + "step": 6430 + }, + { + "epoch": 1.82, + "learning_rate": 9.595562820426758e-07, + "loss": 0.7828, + "step": 6440 + }, + { + "epoch": 1.83, + "learning_rate": 9.292862767972199e-07, + "loss": 0.7895, + "step": 6450 + }, + { + "epoch": 1.83, + "learning_rate": 8.994923588733856e-07, + "loss": 0.7845, + "step": 6460 + }, + { + "epoch": 1.83, + "learning_rate": 8.701751175560102e-07, + "loss": 0.771, + "step": 6470 + }, + { + "epoch": 1.83, + "learning_rate": 8.41335132701887e-07, + "loss": 0.7677, + "step": 6480 + }, + { + "epoch": 1.84, + "learning_rate": 8.129729747283016e-07, + "loss": 0.786, + "step": 6490 + }, + { + "epoch": 1.84, + "learning_rate": 7.85089204601741e-07, + "loss": 0.7883, + "step": 6500 + }, + { + "epoch": 1.84, + "learning_rate": 7.576843738268113e-07, + "loss": 0.7845, + "step": 6510 + }, + { + "epoch": 1.85, + "learning_rate": 7.307590244353263e-07, + "loss": 0.7837, + "step": 6520 + }, + { + "epoch": 1.85, + "learning_rate": 7.043136889755691e-07, + "loss": 0.7697, + "step": 6530 + }, + { + "epoch": 1.85, + "learning_rate": 6.783488905017871e-07, + "loss": 0.782, + "step": 6540 + }, + { + "epoch": 1.85, + "learning_rate": 6.528651425638272e-07, + "loss": 0.7923, + "step": 6550 + }, + { + "epoch": 1.86, + "learning_rate": 6.278629491969862e-07, + "loss": 0.7745, + "step": 6560 + }, + { + "epoch": 1.86, + "learning_rate": 6.033428049120326e-07, + "loss": 0.7882, + "step": 6570 + }, + { + "epoch": 1.86, + "learning_rate": 5.793051946854422e-07, + "loss": 0.7655, + "step": 6580 + }, + { + "epoch": 1.87, + "learning_rate": 5.557505939497915e-07, + "loss": 0.7864, + "step": 6590 + }, + { + "epoch": 1.87, + "learning_rate": 5.326794685843655e-07, + "loss": 0.7793, + "step": 6600 + }, + { + "epoch": 1.87, + "learning_rate": 5.100922749059239e-07, + "loss": 0.787, + "step": 6610 + }, + { + "epoch": 1.87, + "learning_rate": 4.879894596597018e-07, + "loss": 0.7651, + "step": 6620 + }, + { + "epoch": 1.88, + "learning_rate": 4.663714600105534e-07, + "loss": 0.7677, + "step": 6630 + }, + { + "epoch": 1.88, + "learning_rate": 4.452387035343203e-07, + "loss": 0.7847, + "step": 6640 + }, + { + "epoch": 1.88, + "learning_rate": 4.2459160820935153e-07, + "loss": 0.7849, + "step": 6650 + }, + { + "epoch": 1.89, + "learning_rate": 4.044305824082717e-07, + "loss": 0.7688, + "step": 6660 + }, + { + "epoch": 1.89, + "learning_rate": 3.84756024889868e-07, + "loss": 0.7796, + "step": 6670 + }, + { + "epoch": 1.89, + "learning_rate": 3.6556832479123504e-07, + "loss": 0.762, + "step": 6680 + }, + { + "epoch": 1.89, + "learning_rate": 3.468678616200427e-07, + "loss": 0.7947, + "step": 6690 + }, + { + "epoch": 1.9, + "learning_rate": 3.2865500524707217e-07, + "loss": 0.778, + "step": 6700 + }, + { + "epoch": 1.9, + "learning_rate": 3.109301158988609e-07, + "loss": 0.7822, + "step": 6710 + }, + { + "epoch": 1.9, + "learning_rate": 2.936935441506028e-07, + "loss": 0.7796, + "step": 6720 + }, + { + "epoch": 1.91, + "learning_rate": 2.769456309192037e-07, + "loss": 0.7749, + "step": 6730 + }, + { + "epoch": 1.91, + "learning_rate": 2.6068670745654224e-07, + "loss": 0.7731, + "step": 6740 + }, + { + "epoch": 1.91, + "learning_rate": 2.449170953429225e-07, + "loss": 0.7696, + "step": 6750 + }, + { + "epoch": 1.91, + "learning_rate": 2.296371064806957e-07, + "loss": 0.7868, + "step": 6760 + }, + { + "epoch": 1.92, + "learning_rate": 2.1484704308812053e-07, + "loss": 0.7805, + "step": 6770 + }, + { + "epoch": 1.92, + "learning_rate": 2.0054719769335428e-07, + "loss": 0.7802, + "step": 6780 + }, + { + "epoch": 1.92, + "learning_rate": 1.8673785312869063e-07, + "loss": 0.7787, + "step": 6790 + }, + { + "epoch": 1.93, + "learning_rate": 1.7341928252495033e-07, + "loss": 0.7886, + "step": 6800 + }, + { + "epoch": 1.93, + "learning_rate": 1.60591749306091e-07, + "loss": 0.7902, + "step": 6810 + }, + { + "epoch": 1.93, + "learning_rate": 1.4825550718398362e-07, + "loss": 0.7577, + "step": 6820 + }, + { + "epoch": 1.93, + "learning_rate": 1.3641080015341369e-07, + "loss": 0.7703, + "step": 6830 + }, + { + "epoch": 1.94, + "learning_rate": 1.2505786248723229e-07, + "loss": 0.7588, + "step": 6840 + }, + { + "epoch": 1.94, + "learning_rate": 1.1419691873174043e-07, + "loss": 0.7651, + "step": 6850 + }, + { + "epoch": 1.94, + "learning_rate": 1.038281837022398e-07, + "loss": 0.7739, + "step": 6860 + }, + { + "epoch": 1.95, + "learning_rate": 9.395186247878329e-08, + "loss": 0.7628, + "step": 6870 + }, + { + "epoch": 1.95, + "learning_rate": 8.456815040212562e-08, + "loss": 0.7739, + "step": 6880 + }, + { + "epoch": 1.95, + "learning_rate": 7.567723306984853e-08, + "loss": 0.7889, + "step": 6890 + }, + { + "epoch": 1.95, + "learning_rate": 6.727928633270264e-08, + "loss": 0.7842, + "step": 6900 + }, + { + "epoch": 1.96, + "learning_rate": 5.937447629112414e-08, + "loss": 0.7673, + "step": 6910 + }, + { + "epoch": 1.96, + "learning_rate": 5.196295929193739e-08, + "loss": 0.7881, + "step": 6920 + }, + { + "epoch": 1.96, + "learning_rate": 4.5044881925287994e-08, + "loss": 0.7665, + "step": 6930 + }, + { + "epoch": 1.96, + "learning_rate": 3.862038102172283e-08, + "loss": 0.7724, + "step": 6940 + }, + { + "epoch": 1.97, + "learning_rate": 3.268958364948671e-08, + "loss": 0.7703, + "step": 6950 + }, + { + "epoch": 1.97, + "learning_rate": 2.7252607112018823e-08, + "loss": 0.7615, + "step": 6960 + }, + { + "epoch": 1.97, + "learning_rate": 2.2309558945621257e-08, + "loss": 0.7853, + "step": 6970 + }, + { + "epoch": 1.98, + "learning_rate": 1.7860536917341243e-08, + "loss": 0.764, + "step": 6980 + }, + { + "epoch": 1.98, + "learning_rate": 1.3905629023031052e-08, + "loss": 0.773, + "step": 6990 + }, + { + "epoch": 1.98, + "learning_rate": 1.0444913485610498e-08, + "loss": 0.7812, + "step": 7000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 2.4796030086068306e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/checkpoint-7000/training_args.bin b/sft-lora/checkpoint-7000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/checkpoint-7000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/finetuning_args.json b/sft-lora/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-lora/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-lora/train_results.json b/sft-lora/train_results.json new file mode 100644 index 0000000000000000000000000000000000000000..04c7e4f99f6e15df1ed565949ba52b8573052183 --- /dev/null +++ b/sft-lora/train_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 2.0, + "train_loss": 0.819440008492324, + "train_runtime": 68529.0816, + "train_samples_per_second": 6.597, + "train_steps_per_second": 0.103 +} \ No newline at end of file diff --git a/sft-lora/trainer_log.jsonl b/sft-lora/trainer_log.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5a7c99adcfd3ab0cfbd9ff78b659a3455515d9db --- /dev/null +++ b/sft-lora/trainer_log.jsonl @@ -0,0 +1,2824 @@ +{"current_steps": 10, "total_steps": 7064, "loss": 1.293, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:01:43", "remaining_time": "20:15:41"} +{"current_steps": 10, "total_steps": 7064, "loss": 1.293, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:01:41", "remaining_time": "19:55:47"} +{"current_steps": 10, "total_steps": 7064, "loss": 1.293, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:05:36", "remaining_time": "2 days, 17:54:02"} +{"current_steps": 10, "total_steps": 7064, "loss": 1.293, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:01:42", "remaining_time": "20:06:23"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2584, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:07:04", "remaining_time": "1 day, 17:30:34"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2584, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:03:11", "remaining_time": "18:43:20"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2584, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:03:09", "remaining_time": "18:33:24"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2584, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:03:10", "remaining_time": "18:38:41"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2075, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:08:34", "remaining_time": "1 day, 9:29:13"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2075, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:04:40", "remaining_time": "18:15:55"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2075, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:04:39", "remaining_time": "18:12:24"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2075, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:04:41", "remaining_time": "18:19:01"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.1718, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:10:06", "remaining_time": "1 day, 5:34:58"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.1718, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:06:12", "remaining_time": "18:10:58"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.1718, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:06:13", "remaining_time": "18:13:17"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.1718, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:06:11", "remaining_time": "18:08:20"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1483, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:07:45", "remaining_time": "18:08:53"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1483, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:07:46", "remaining_time": "18:10:44"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1483, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:07:44", "remaining_time": "18:06:47"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1483, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:11:39", "remaining_time": "1 day, 3:15:18"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.122, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:13:13", "remaining_time": "1 day, 1:44:08"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.122, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:09:19", "remaining_time": "18:09:26"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.122, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:09:19", "remaining_time": "18:07:41"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.122, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:09:20", "remaining_time": "18:10:59"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.0971, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:10:54", "remaining_time": "18:10:29"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.0971, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:10:54", "remaining_time": "18:09:10"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.0971, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:14:47", "remaining_time": "1 day, 0:38:21"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.0971, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:10:53", "remaining_time": "18:07:40"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0756, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:12:28", "remaining_time": "18:09:16"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0756, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:12:29", "remaining_time": "18:10:25"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0756, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:12:27", "remaining_time": "18:07:57"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0756, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:16:22", "remaining_time": "23:49:19"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:17:55", "remaining_time": "23:09:13"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:14:01", "remaining_time": "18:06:14"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:14:01", "remaining_time": "18:07:23"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:14:02", "remaining_time": "18:08:25"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0705, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:19:31", "remaining_time": "22:40:11"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0705, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:15:38", "remaining_time": "18:09:50"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0705, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:15:37", "remaining_time": "18:07:52"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0705, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:15:38", "remaining_time": "18:08:55"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:21:05", "remaining_time": "22:13:22"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:17:10", "remaining_time": "18:06:11"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:17:11", "remaining_time": "18:07:07"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0673, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:17:12", "remaining_time": "18:07:58"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.031, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:22:40", "remaining_time": "21:52:11"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.031, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:18:46", "remaining_time": "18:06:47"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.031, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:18:47", "remaining_time": "18:07:33"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.031, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:18:45", "remaining_time": "18:05:55"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.0383, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:20:23", "remaining_time": "18:07:37"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.0383, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:20:22", "remaining_time": "18:06:54"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.0383, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:20:21", "remaining_time": "18:06:06"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.0383, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:24:16", "remaining_time": "21:34:40"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0097, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:25:49", "remaining_time": "21:17:38"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0097, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:21:55", "remaining_time": "18:04:15"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0097, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:21:57", "remaining_time": "18:05:38"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0097, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:21:56", "remaining_time": "18:04:59"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.012, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:23:32", "remaining_time": "18:04:56"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.012, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:27:25", "remaining_time": "21:04:28"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.012, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:23:33", "remaining_time": "18:05:32"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.012, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:23:31", "remaining_time": "18:04:14"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9834, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:25:11", "remaining_time": "18:07:14"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9834, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:29:05", "remaining_time": "20:55:18"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9834, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:25:12", "remaining_time": "18:07:48"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9834, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:25:10", "remaining_time": "18:06:35"} +{"current_steps": 170, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:30:41", "remaining_time": "20:44:34"} +{"current_steps": 170, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:26:46", "remaining_time": "18:06:00"} +{"current_steps": 170, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:26:48", "remaining_time": "18:07:08"} +{"current_steps": 170, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:26:47", "remaining_time": "18:06:36"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:32:16", "remaining_time": "20:34:38"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:28:24", "remaining_time": "18:06:10"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:28:23", "remaining_time": "18:05:40"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9908, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:28:22", "remaining_time": "18:05:05"} +{"current_steps": 190, "total_steps": 7064, "loss": 0.9913, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:29:57", "remaining_time": "18:03:41"} +{"current_steps": 190, "total_steps": 7064, "loss": 0.9913, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:29:58", "remaining_time": "18:04:13"} +{"current_steps": 190, "total_steps": 7064, "loss": 0.9913, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:29:58", "remaining_time": "18:04:42"} +{"current_steps": 190, "total_steps": 7064, "loss": 0.9913, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:33:51", "remaining_time": "20:25:09"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9782, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:35:28", "remaining_time": "20:17:15"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9782, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:31:34", "remaining_time": "18:03:34"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9782, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:31:35", "remaining_time": "18:04:01"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9782, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:31:33", "remaining_time": "18:03:03"} +{"current_steps": 210, "total_steps": 7064, "loss": 0.9954, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:37:02", "remaining_time": "20:09:06"} +{"current_steps": 210, "total_steps": 7064, "loss": 0.9954, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:33:09", "remaining_time": "18:02:24"} +{"current_steps": 210, "total_steps": 7064, "loss": 0.9954, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:33:08", "remaining_time": "18:01:29"} +{"current_steps": 210, "total_steps": 7064, "loss": 0.9954, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:33:09", "remaining_time": "18:01:58"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.975, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:38:35", "remaining_time": "20:00:40"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.975, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:34:42", "remaining_time": "17:59:54"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.975, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:34:42", "remaining_time": "17:59:29"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.975, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:34:41", "remaining_time": "17:59:01"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9687, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:40:09", "remaining_time": "19:53:08"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9687, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:36:15", "remaining_time": "17:57:24"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9687, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:36:14", "remaining_time": "17:56:57"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9687, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:36:16", "remaining_time": "17:57:48"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9677, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:41:45", "remaining_time": "19:47:19"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9677, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:37:52", "remaining_time": "17:56:57"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9677, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:37:50", "remaining_time": "17:56:09"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9677, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:37:51", "remaining_time": "17:56:34"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9715, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:43:21", "remaining_time": "19:41:32"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9715, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:39:28", "remaining_time": "17:55:44"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9715, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:39:26", "remaining_time": "17:54:58"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9715, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:39:27", "remaining_time": "17:55:22"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9692, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:44:54", "remaining_time": "19:35:19"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9692, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:41:01", "remaining_time": "17:53:44"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9692, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:41:00", "remaining_time": "17:53:00"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9692, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:41:01", "remaining_time": "17:53:23"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9627, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:42:33", "remaining_time": "17:51:05"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9627, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:42:34", "remaining_time": "17:51:25"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9627, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:42:33", "remaining_time": "17:50:42"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9627, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:46:27", "remaining_time": "19:29:06"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.9784, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:48:01", "remaining_time": "19:23:32"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.9784, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:44:07", "remaining_time": "17:49:10"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.9784, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:44:06", "remaining_time": "17:48:48"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.9784, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:44:08", "remaining_time": "17:49:29"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.941, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:49:35", "remaining_time": "19:18:32"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.941, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:45:42", "remaining_time": "17:47:51"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.941, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:45:41", "remaining_time": "17:47:12"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.941, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:45:42", "remaining_time": "17:47:33"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9623, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:51:12", "remaining_time": "19:14:33"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9623, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:47:17", "remaining_time": "17:46:23"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9623, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:47:18", "remaining_time": "17:46:43"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9623, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:47:19", "remaining_time": "17:47:01"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9401, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:48:55", "remaining_time": "17:45:57"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9401, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:48:54", "remaining_time": "17:45:39"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9401, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:48:53", "remaining_time": "17:45:20"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9401, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:52:48", "remaining_time": "19:10:31"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9152, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:54:23", "remaining_time": "19:06:27"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9152, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:50:30", "remaining_time": "17:44:22"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9152, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:50:29", "remaining_time": "17:44:03"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9152, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:50:31", "remaining_time": "17:44:38"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9405, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:55:57", "remaining_time": "19:01:52"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9405, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:52:04", "remaining_time": "17:42:39"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9405, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:52:02", "remaining_time": "17:42:05"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9405, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:52:03", "remaining_time": "17:42:23"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9431, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "0:57:33", "remaining_time": "18:58:08"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9431, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "0:53:40", "remaining_time": "17:41:22"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9431, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "0:53:38", "remaining_time": "17:40:49"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9431, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "0:53:39", "remaining_time": "17:41:07"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9512, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "0:59:08", "remaining_time": "18:54:38"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9512, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "0:55:16", "remaining_time": "17:40:10"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9512, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "0:55:14", "remaining_time": "17:39:37"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9512, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "0:55:15", "remaining_time": "17:39:55"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9301, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "1:00:43", "remaining_time": "18:50:42"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9301, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "0:56:48", "remaining_time": "17:37:53"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9301, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "0:56:50", "remaining_time": "17:38:25"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9301, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "0:56:49", "remaining_time": "17:38:10"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.917, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "0:58:25", "remaining_time": "17:37:07"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.917, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "0:58:26", "remaining_time": "17:37:21"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.917, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "0:58:24", "remaining_time": "17:36:50"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.917, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "1:02:19", "remaining_time": "18:47:35"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9162, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "0:59:58", "remaining_time": "17:35:02"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9162, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "0:59:58", "remaining_time": "17:34:47"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9162, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "0:59:59", "remaining_time": "17:35:16"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9162, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "1:03:52", "remaining_time": "18:43:33"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9207, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:01:36", "remaining_time": "17:34:11"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9207, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:01:36", "remaining_time": "17:34:25"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9207, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:01:35", "remaining_time": "17:33:56"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9207, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:05:29", "remaining_time": "18:40:51"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.924, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:07:01", "remaining_time": "18:36:44"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.924, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:03:08", "remaining_time": "17:31:51"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.924, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:03:08", "remaining_time": "17:32:04"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.924, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:03:07", "remaining_time": "17:31:36"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9025, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:08:37", "remaining_time": "18:33:48"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9025, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:04:44", "remaining_time": "17:30:35"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9025, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:04:44", "remaining_time": "17:30:48"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9025, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:04:43", "remaining_time": "17:30:20"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9027, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:10:12", "remaining_time": "18:30:37"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9027, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:06:19", "remaining_time": "17:29:12"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9027, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:06:17", "remaining_time": "17:28:46"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9027, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:06:18", "remaining_time": "17:29:00"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9167, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:11:48", "remaining_time": "18:27:52"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9167, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:07:54", "remaining_time": "17:27:47"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9167, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:07:55", "remaining_time": "17:27:59"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9167, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:07:53", "remaining_time": "17:27:33"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9119, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:09:28", "remaining_time": "17:25:52"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9119, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:09:27", "remaining_time": "17:25:40"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9119, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:09:26", "remaining_time": "17:25:26"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9119, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:13:21", "remaining_time": "18:24:18"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9042, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:11:03", "remaining_time": "17:24:25"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9042, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:11:01", "remaining_time": "17:24:00"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9042, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:11:02", "remaining_time": "17:24:14"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9042, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:14:56", "remaining_time": "18:21:29"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9113, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:12:36", "remaining_time": "17:22:24"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9113, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:12:38", "remaining_time": "17:22:48"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9113, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:12:37", "remaining_time": "17:22:37"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9113, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:16:31", "remaining_time": "18:18:32"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9297, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:18:05", "remaining_time": "18:15:30"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9297, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:14:10", "remaining_time": "17:20:39"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9297, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:14:11", "remaining_time": "17:20:52"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9297, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:14:12", "remaining_time": "17:21:03"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9194, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:19:39", "remaining_time": "18:12:39"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9194, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:15:44", "remaining_time": "17:19:01"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9194, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:15:46", "remaining_time": "17:19:24"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9194, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:15:45", "remaining_time": "17:19:13"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.8978, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:17:22", "remaining_time": "17:18:05"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.8978, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:21:17", "remaining_time": "18:10:33"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.8978, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:17:23", "remaining_time": "17:18:18"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.8978, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:17:24", "remaining_time": "17:18:28"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.9217, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:22:57", "remaining_time": "18:08:58"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.9217, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:19:02", "remaining_time": "17:17:38"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.9217, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:19:04", "remaining_time": "17:18:00"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.9217, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:19:03", "remaining_time": "17:17:50"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.8997, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:24:37", "remaining_time": "18:07:33"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.8997, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:20:44", "remaining_time": "17:17:40"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.8997, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:20:43", "remaining_time": "17:17:18"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.8997, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:20:43", "remaining_time": "17:17:29"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9045, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:26:11", "remaining_time": "18:04:47"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9045, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:22:19", "remaining_time": "17:15:56"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9045, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:22:17", "remaining_time": "17:15:35"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9045, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:22:18", "remaining_time": "17:15:46"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.8985, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:23:51", "remaining_time": "17:13:52"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.8985, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:27:44", "remaining_time": "18:01:44"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.8985, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:23:50", "remaining_time": "17:13:32"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.8985, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:23:50", "remaining_time": "17:13:43"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9171, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:29:17", "remaining_time": "17:58:42"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9171, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:25:24", "remaining_time": "17:11:48"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9171, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:25:22", "remaining_time": "17:11:27"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9171, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:25:23", "remaining_time": "17:11:38"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.9001, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:27:01", "remaining_time": "17:10:36"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.9001, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:26:59", "remaining_time": "17:10:16"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.9001, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:30:53", "remaining_time": "17:56:35"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.9001, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:27:00", "remaining_time": "17:10:27"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8824, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:32:30", "remaining_time": "17:54:25"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8824, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:28:35", "remaining_time": "17:09:00"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8824, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:28:36", "remaining_time": "17:09:11"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8824, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:28:37", "remaining_time": "17:09:20"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9046, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:34:02", "remaining_time": "17:51:29"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9046, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:30:08", "remaining_time": "17:06:56"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9046, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:30:09", "remaining_time": "17:07:06"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9046, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:30:09", "remaining_time": "17:07:15"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.8888, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:35:37", "remaining_time": "17:49:01"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.8888, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:31:42", "remaining_time": "17:05:18"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.8888, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:31:43", "remaining_time": "17:05:28"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.8888, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:31:44", "remaining_time": "17:05:37"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.889, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:37:07", "remaining_time": "17:45:49"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.889, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:33:15", "remaining_time": "17:03:13"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.889, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:33:13", "remaining_time": "17:02:54"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.889, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:33:14", "remaining_time": "17:03:04"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:34:51", "remaining_time": "17:01:55"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:38:44", "remaining_time": "17:43:44"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:34:49", "remaining_time": "17:01:37"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:34:50", "remaining_time": "17:01:47"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8858, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:36:25", "remaining_time": "17:00:09"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8858, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:36:26", "remaining_time": "17:00:18"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8858, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:36:24", "remaining_time": "17:00:00"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8858, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:40:18", "remaining_time": "17:41:22"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:38:01", "remaining_time": "16:58:44"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:37:59", "remaining_time": "16:58:27"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:38:00", "remaining_time": "16:58:36"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:41:53", "remaining_time": "17:39:05"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:39:34", "remaining_time": "16:56:59"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:43:28", "remaining_time": "17:36:46"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:39:33", "remaining_time": "16:56:50"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:39:35", "remaining_time": "16:57:07"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.8967, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:41:07", "remaining_time": "16:54:58"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.8967, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:41:07", "remaining_time": "16:55:06"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.8967, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:41:06", "remaining_time": "16:54:49"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.8967, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:45:00", "remaining_time": "17:34:04"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8925, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:46:37", "remaining_time": "17:32:08"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8925, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:42:44", "remaining_time": "16:53:50"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8925, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:42:42", "remaining_time": "16:53:33"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8925, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:42:43", "remaining_time": "16:53:42"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.883, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:48:11", "remaining_time": "17:29:51"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.883, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:44:18", "remaining_time": "16:52:04"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.883, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:44:17", "remaining_time": "16:51:55"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.883, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:44:19", "remaining_time": "16:52:11"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8823, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:49:45", "remaining_time": "17:27:23"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8823, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:45:50", "remaining_time": "16:50:04"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8823, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:45:52", "remaining_time": "16:50:20"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8823, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:45:51", "remaining_time": "16:50:13"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:51:23", "remaining_time": "17:25:43"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:47:28", "remaining_time": "16:49:00"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:47:29", "remaining_time": "16:49:09"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:47:30", "remaining_time": "16:49:16"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8695, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:49:05", "remaining_time": "16:47:48"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8695, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:52:58", "remaining_time": "17:23:40"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8695, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:49:04", "remaining_time": "16:47:32"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8695, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:49:05", "remaining_time": "16:47:41"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8873, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "1:54:35", "remaining_time": "17:21:49"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8873, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "1:50:41", "remaining_time": "16:46:16"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8873, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "1:50:41", "remaining_time": "16:46:25"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8873, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "1:50:42", "remaining_time": "16:46:32"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "1:56:10", "remaining_time": "17:19:45"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "1:52:18", "remaining_time": "16:45:00"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "1:52:16", "remaining_time": "16:44:45"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8862, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "1:52:17", "remaining_time": "16:44:53"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "1:57:47", "remaining_time": "17:17:50"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "1:53:52", "remaining_time": "16:43:23"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "1:53:54", "remaining_time": "16:43:38"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "1:53:53", "remaining_time": "16:43:31"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8834, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "1:59:24", "remaining_time": "17:16:02"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8834, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "1:55:30", "remaining_time": "16:42:14"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8834, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "1:55:31", "remaining_time": "16:42:21"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8834, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "1:55:29", "remaining_time": "16:42:06"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8744, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "1:57:03", "remaining_time": "16:40:25"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8744, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "1:57:02", "remaining_time": "16:40:11"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8744, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "1:57:03", "remaining_time": "16:40:18"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8744, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "2:00:56", "remaining_time": "17:13:36"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.876, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "2:02:33", "remaining_time": "17:11:47"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.876, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "1:58:39", "remaining_time": "16:38:52"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.876, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "1:58:39", "remaining_time": "16:39:00"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.876, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "1:58:40", "remaining_time": "16:39:07"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8874, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:04:10", "remaining_time": "17:09:56"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8874, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:00:17", "remaining_time": "16:37:44"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8874, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:00:15", "remaining_time": "16:37:30"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8874, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:00:16", "remaining_time": "16:37:38"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8938, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:05:42", "remaining_time": "17:07:32"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8938, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:01:47", "remaining_time": "16:35:34"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8938, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:01:49", "remaining_time": "16:35:48"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8938, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:01:48", "remaining_time": "16:35:41"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8855, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:07:20", "remaining_time": "17:05:51"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8855, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:03:27", "remaining_time": "16:34:35"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8855, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:03:25", "remaining_time": "16:34:21"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8855, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:03:26", "remaining_time": "16:34:28"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8827, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:08:54", "remaining_time": "17:03:47"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8827, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:05:00", "remaining_time": "16:32:44"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8827, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:05:01", "remaining_time": "16:32:57"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8827, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:05:01", "remaining_time": "16:32:51"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8736, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:06:34", "remaining_time": "16:31:03"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8736, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:06:35", "remaining_time": "16:31:10"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8736, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:06:35", "remaining_time": "16:31:16"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8736, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:10:28", "remaining_time": "17:01:40"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:12:02", "remaining_time": "16:59:30"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:08:08", "remaining_time": "16:29:26"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:08:08", "remaining_time": "16:29:19"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:08:09", "remaining_time": "16:29:32"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.862, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:09:42", "remaining_time": "16:27:40"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.862, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:13:36", "remaining_time": "16:57:20"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.862, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:09:41", "remaining_time": "16:27:33"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.862, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:09:43", "remaining_time": "16:27:46"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:11:19", "remaining_time": "16:26:24"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:11:20", "remaining_time": "16:26:30"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:11:19", "remaining_time": "16:26:18"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:15:13", "remaining_time": "16:55:40"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8745, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:12:52", "remaining_time": "16:24:36"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8745, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:12:52", "remaining_time": "16:24:29"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8745, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:12:53", "remaining_time": "16:24:41"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8745, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:16:46", "remaining_time": "16:53:27"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.8594, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:14:30", "remaining_time": "16:23:16"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.8594, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:14:29", "remaining_time": "16:23:10"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.8594, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:14:30", "remaining_time": "16:23:22"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.8594, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:18:23", "remaining_time": "16:51:45"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8839, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:16:06", "remaining_time": "16:21:51"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8839, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:16:07", "remaining_time": "16:21:56"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8839, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:16:05", "remaining_time": "16:21:44"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8839, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:20:00", "remaining_time": "16:49:57"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8536, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:21:38", "remaining_time": "16:48:24"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8536, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:17:44", "remaining_time": "16:20:40"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8536, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:17:45", "remaining_time": "16:20:46"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8536, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:17:43", "remaining_time": "16:20:34"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8765, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:19:19", "remaining_time": "16:19:04"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8765, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:19:18", "remaining_time": "16:18:59"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8765, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:19:17", "remaining_time": "16:18:52"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8765, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:23:12", "remaining_time": "16:46:21"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8726, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:24:49", "remaining_time": "16:44:37"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8726, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:20:55", "remaining_time": "16:17:36"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8726, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:20:54", "remaining_time": "16:17:29"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8726, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:20:56", "remaining_time": "16:17:41"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8664, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:26:26", "remaining_time": "16:42:55"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8664, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:22:33", "remaining_time": "16:16:20"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8664, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:22:32", "remaining_time": "16:16:15"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8664, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:22:31", "remaining_time": "16:16:09"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:28:02", "remaining_time": "16:41:09"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:24:09", "remaining_time": "16:14:54"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:24:07", "remaining_time": "16:14:42"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:24:08", "remaining_time": "16:14:48"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.878, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:29:32", "remaining_time": "16:38:38"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.878, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:25:39", "remaining_time": "16:12:42"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.878, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:25:37", "remaining_time": "16:12:31"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.878, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:25:38", "remaining_time": "16:12:37"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:31:05", "remaining_time": "16:36:30"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:27:12", "remaining_time": "16:10:54"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:27:11", "remaining_time": "16:10:49"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:27:10", "remaining_time": "16:10:43"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8614, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:32:39", "remaining_time": "16:34:35"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8614, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:28:46", "remaining_time": "16:09:17"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8614, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:28:45", "remaining_time": "16:09:06"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8614, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:28:46", "remaining_time": "16:09:12"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.8629, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:34:15", "remaining_time": "16:32:47"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.8629, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:30:21", "remaining_time": "16:07:43"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.8629, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:30:21", "remaining_time": "16:07:37"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.8629, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:30:22", "remaining_time": "16:07:48"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8635, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:35:53", "remaining_time": "16:31:13"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8635, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:31:59", "remaining_time": "16:06:27"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8635, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:32:00", "remaining_time": "16:06:32"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8635, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:31:58", "remaining_time": "16:06:21"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:37:26", "remaining_time": "16:29:10"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:33:32", "remaining_time": "16:04:36"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:33:33", "remaining_time": "16:04:41"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:33:34", "remaining_time": "16:04:46"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:35:07", "remaining_time": "16:03:00"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:39:00", "remaining_time": "16:27:06"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:35:05", "remaining_time": "16:02:49"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:35:06", "remaining_time": "16:02:55"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8621, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:36:40", "remaining_time": "16:01:13"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8621, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:40:33", "remaining_time": "16:25:02"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8621, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:36:39", "remaining_time": "16:01:08"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8621, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:36:38", "remaining_time": "16:01:03"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:38:13", "remaining_time": "15:59:29"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:38:14", "remaining_time": "15:59:34"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:38:12", "remaining_time": "15:59:24"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:42:07", "remaining_time": "16:23:06"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:43:43", "remaining_time": "16:21:22"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:39:49", "remaining_time": "15:58:01"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:39:48", "remaining_time": "15:57:56"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:39:50", "remaining_time": "15:58:06"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:45:18", "remaining_time": "16:19:31"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:41:24", "remaining_time": "15:56:26"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:41:25", "remaining_time": "15:56:30"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.8687, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:41:23", "remaining_time": "15:56:20"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8505, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:46:56", "remaining_time": "16:17:57"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8505, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:43:02", "remaining_time": "15:55:08"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8505, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:43:03", "remaining_time": "15:55:13"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8505, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:43:01", "remaining_time": "15:55:03"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8754, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:44:39", "remaining_time": "15:53:43"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8754, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:44:40", "remaining_time": "15:53:48"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8754, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:44:38", "remaining_time": "15:53:38"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8754, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:48:32", "remaining_time": "16:16:17"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:50:08", "remaining_time": "16:14:31"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:46:14", "remaining_time": "15:52:12"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:46:15", "remaining_time": "15:52:17"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:46:14", "remaining_time": "15:52:07"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.8698, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "2:51:45", "remaining_time": "16:12:51"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.8698, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "2:47:51", "remaining_time": "15:50:47"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.8698, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "2:47:52", "remaining_time": "15:50:51"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.8698, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "2:47:50", "remaining_time": "15:50:42"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8661, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "2:53:21", "remaining_time": "16:11:07"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8661, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "2:49:28", "remaining_time": "15:49:22"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8661, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "2:49:26", "remaining_time": "15:49:12"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8661, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "2:49:27", "remaining_time": "15:49:17"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8574, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "2:54:56", "remaining_time": "16:09:17"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8574, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "2:51:01", "remaining_time": "15:47:37"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8574, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "2:51:03", "remaining_time": "15:47:46"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8574, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "2:51:02", "remaining_time": "15:47:42"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.852, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "2:56:31", "remaining_time": "16:07:29"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.852, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "2:52:37", "remaining_time": "15:46:08"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.852, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "2:52:36", "remaining_time": "15:46:03"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.852, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "2:52:38", "remaining_time": "15:46:12"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "2:58:07", "remaining_time": "16:05:44"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "2:54:13", "remaining_time": "15:44:37"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "2:54:14", "remaining_time": "15:44:42"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "2:54:12", "remaining_time": "15:44:32"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "2:55:52", "remaining_time": "15:43:22"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "2:55:51", "remaining_time": "15:43:17"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "2:55:53", "remaining_time": "15:43:26"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8632, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "2:59:46", "remaining_time": "16:04:16"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "2:57:29", "remaining_time": "15:41:58"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "2:57:28", "remaining_time": "15:41:54"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "2:57:27", "remaining_time": "15:41:49"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "3:01:22", "remaining_time": "16:02:34"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "2:59:06", "remaining_time": "15:40:32"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "2:59:07", "remaining_time": "15:40:36"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "2:59:05", "remaining_time": "15:40:27"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "3:02:59", "remaining_time": "16:00:59"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8465, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:04:36", "remaining_time": "15:59:18"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8465, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:00:43", "remaining_time": "15:39:08"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8465, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:00:41", "remaining_time": "15:38:59"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8465, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:00:42", "remaining_time": "15:39:04"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:02:18", "remaining_time": "15:37:30"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:06:11", "remaining_time": "15:57:28"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:02:16", "remaining_time": "15:37:21"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:02:17", "remaining_time": "15:37:26"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8649, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:07:53", "remaining_time": "15:56:17"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8649, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:04:00", "remaining_time": "15:36:32"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8649, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:03:58", "remaining_time": "15:36:23"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8649, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:03:59", "remaining_time": "15:36:27"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8572, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:05:39", "remaining_time": "15:35:15"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8572, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:05:40", "remaining_time": "15:35:19"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8572, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:05:38", "remaining_time": "15:35:11"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8572, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:09:33", "remaining_time": "15:54:53"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:11:08", "remaining_time": "15:53:07"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:07:14", "remaining_time": "15:33:42"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:07:13", "remaining_time": "15:33:37"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:07:15", "remaining_time": "15:33:46"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8478, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:12:46", "remaining_time": "15:51:32"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8478, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:08:52", "remaining_time": "15:32:19"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8478, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:08:53", "remaining_time": "15:32:23"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8478, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:08:51", "remaining_time": "15:32:14"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8475, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:10:34", "remaining_time": "15:31:17"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8475, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:10:35", "remaining_time": "15:31:21"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8475, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:10:33", "remaining_time": "15:31:13"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8475, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:14:28", "remaining_time": "15:50:19"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8537, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:16:05", "remaining_time": "15:48:41"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8537, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:12:12", "remaining_time": "15:29:54"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8537, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:12:10", "remaining_time": "15:29:45"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8537, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:12:11", "remaining_time": "15:29:50"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8499, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:17:43", "remaining_time": "15:47:08"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8499, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:13:50", "remaining_time": "15:28:32"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8499, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:13:49", "remaining_time": "15:28:28"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8499, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:13:48", "remaining_time": "15:28:24"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:19:22", "remaining_time": "15:45:40"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:15:28", "remaining_time": "15:27:07"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:15:29", "remaining_time": "15:27:15"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:15:28", "remaining_time": "15:27:11"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8538, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:20:59", "remaining_time": "15:44:00"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8538, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:17:05", "remaining_time": "15:25:43"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8538, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:17:06", "remaining_time": "15:25:46"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8538, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:17:04", "remaining_time": "15:25:38"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:22:37", "remaining_time": "15:42:25"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:18:42", "remaining_time": "15:24:14"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:18:44", "remaining_time": "15:24:22"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8619, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:18:43", "remaining_time": "15:24:18"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:24:12", "remaining_time": "15:40:40"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:20:18", "remaining_time": "15:22:39"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:20:19", "remaining_time": "15:22:47"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:20:19", "remaining_time": "15:22:43"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8484, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:25:51", "remaining_time": "15:39:09"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8484, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:21:57", "remaining_time": "15:21:22"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8484, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:21:56", "remaining_time": "15:21:18"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8484, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:21:58", "remaining_time": "15:21:26"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:27:27", "remaining_time": "15:37:28"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:23:34", "remaining_time": "15:19:52"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:23:33", "remaining_time": "15:19:48"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:23:34", "remaining_time": "15:19:56"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8547, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:25:10", "remaining_time": "15:18:22"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8547, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:29:04", "remaining_time": "15:35:48"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8547, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:25:09", "remaining_time": "15:18:18"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8547, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:25:11", "remaining_time": "15:18:26"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:30:41", "remaining_time": "15:34:10"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:26:46", "remaining_time": "15:16:50"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:26:48", "remaining_time": "15:16:57"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:26:47", "remaining_time": "15:16:54"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.839, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:32:18", "remaining_time": "15:32:32"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.839, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:28:25", "remaining_time": "15:15:29"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.839, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:28:24", "remaining_time": "15:15:25"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.839, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:28:23", "remaining_time": "15:15:21"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:30:00", "remaining_time": "15:13:51"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:30:01", "remaining_time": "15:13:54"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:29:59", "remaining_time": "15:13:47"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:33:54", "remaining_time": "15:30:48"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8404, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:35:31", "remaining_time": "15:29:10"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8404, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:31:38", "remaining_time": "15:12:25"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8404, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:31:37", "remaining_time": "15:12:22"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8404, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:31:36", "remaining_time": "15:12:18"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.843, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:37:08", "remaining_time": "15:27:35"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.843, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:33:14", "remaining_time": "15:10:52"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.843, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:33:16", "remaining_time": "15:11:00"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.843, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:33:15", "remaining_time": "15:10:56"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8557, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:38:47", "remaining_time": "15:26:01"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8557, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:34:53", "remaining_time": "15:09:32"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8557, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:34:54", "remaining_time": "15:09:35"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8557, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:34:52", "remaining_time": "15:09:28"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8504, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:36:28", "remaining_time": "15:07:56"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8504, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:40:23", "remaining_time": "15:24:20"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8504, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:36:29", "remaining_time": "15:08:00"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8504, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:36:30", "remaining_time": "15:08:03"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8579, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:42:01", "remaining_time": "15:22:46"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8579, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:38:07", "remaining_time": "15:06:34"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8579, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:38:06", "remaining_time": "15:06:31"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8579, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:38:08", "remaining_time": "15:06:38"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8563, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:43:37", "remaining_time": "15:21:05"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8563, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:39:44", "remaining_time": "15:05:03"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8563, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:39:43", "remaining_time": "15:04:59"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8563, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:39:44", "remaining_time": "15:05:06"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:45:15", "remaining_time": "15:19:32"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:41:22", "remaining_time": "15:03:38"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:41:21", "remaining_time": "15:03:34"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:41:22", "remaining_time": "15:03:41"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:46:51", "remaining_time": "15:17:48"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:42:56", "remaining_time": "15:01:58"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:42:58", "remaining_time": "15:02:05"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.8524, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:42:57", "remaining_time": "15:02:02"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "3:48:27", "remaining_time": "15:16:05"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "3:44:32", "remaining_time": "15:00:24"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "3:44:34", "remaining_time": "15:00:31"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8417, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "3:44:33", "remaining_time": "15:00:28"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8582, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "3:50:03", "remaining_time": "15:14:25"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8582, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "3:46:10", "remaining_time": "14:58:59"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8582, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "3:46:09", "remaining_time": "14:58:52"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8582, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "3:46:10", "remaining_time": "14:58:56"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.841, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "3:51:38", "remaining_time": "15:12:38"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.841, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "3:47:45", "remaining_time": "14:57:20"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.841, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "3:47:43", "remaining_time": "14:57:14"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.841, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "3:47:44", "remaining_time": "14:57:17"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "3:53:16", "remaining_time": "15:11:03"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "3:49:22", "remaining_time": "14:55:50"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "3:49:21", "remaining_time": "14:55:47"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8529, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "3:49:23", "remaining_time": "14:55:53"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "3:54:55", "remaining_time": "15:09:35"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "3:51:03", "remaining_time": "14:54:33"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "3:51:01", "remaining_time": "14:54:27"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "3:51:02", "remaining_time": "14:54:30"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8471, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "3:56:33", "remaining_time": "15:07:59"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8471, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "3:52:39", "remaining_time": "14:53:02"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8471, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "3:52:40", "remaining_time": "14:53:05"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8471, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "3:52:38", "remaining_time": "14:52:59"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8379, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "3:58:11", "remaining_time": "15:06:25"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8379, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "3:54:16", "remaining_time": "14:51:32"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8379, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "3:54:18", "remaining_time": "14:51:38"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8379, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "3:54:17", "remaining_time": "14:51:35"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "3:55:56", "remaining_time": "14:50:11"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "3:55:58", "remaining_time": "14:50:18"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "3:55:57", "remaining_time": "14:50:15"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "3:59:51", "remaining_time": "15:04:56"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8463, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "3:57:31", "remaining_time": "14:48:33"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8463, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "4:01:25", "remaining_time": "15:03:07"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8463, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "3:57:30", "remaining_time": "14:48:30"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8463, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "3:57:32", "remaining_time": "14:48:36"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8362, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "3:59:04", "remaining_time": "14:46:50"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8362, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "3:59:06", "remaining_time": "14:46:56"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8362, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "3:59:05", "remaining_time": "14:46:53"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8362, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "4:02:59", "remaining_time": "15:01:20"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:04:38", "remaining_time": "14:59:48"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:00:45", "remaining_time": "14:45:31"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:00:43", "remaining_time": "14:45:25"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8467, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:00:44", "remaining_time": "14:45:28"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:06:15", "remaining_time": "14:58:11"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:02:20", "remaining_time": "14:43:55"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:02:22", "remaining_time": "14:44:01"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:02:21", "remaining_time": "14:43:58"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:04:00", "remaining_time": "14:42:33"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:07:53", "remaining_time": "14:56:35"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:03:58", "remaining_time": "14:42:27"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:03:59", "remaining_time": "14:42:30"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:09:28", "remaining_time": "14:54:51"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:05:34", "remaining_time": "14:40:53"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:05:33", "remaining_time": "14:40:49"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:05:35", "remaining_time": "14:40:55"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8297, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:11:04", "remaining_time": "14:53:12"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8297, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:07:11", "remaining_time": "14:39:23"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8297, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:07:10", "remaining_time": "14:39:17"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8297, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:07:11", "remaining_time": "14:39:20"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8532, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:08:50", "remaining_time": "14:37:58"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8532, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:12:45", "remaining_time": "14:51:46"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8532, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:08:51", "remaining_time": "14:38:01"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8532, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:08:52", "remaining_time": "14:38:04"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.854, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:14:22", "remaining_time": "14:50:09"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.854, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:10:28", "remaining_time": "14:36:31"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.854, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:10:28", "remaining_time": "14:36:28"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.854, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:10:29", "remaining_time": "14:36:34"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:12:06", "remaining_time": "14:35:02"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:12:05", "remaining_time": "14:34:59"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:12:07", "remaining_time": "14:35:05"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:16:00", "remaining_time": "14:48:33"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:17:37", "remaining_time": "14:46:55"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:13:44", "remaining_time": "14:33:33"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:13:42", "remaining_time": "14:33:27"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:13:43", "remaining_time": "14:33:30"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8394, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:19:14", "remaining_time": "14:45:19"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8394, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:15:21", "remaining_time": "14:32:03"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8394, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:15:20", "remaining_time": "14:31:58"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8394, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:15:20", "remaining_time": "14:32:01"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:20:52", "remaining_time": "14:43:44"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:16:58", "remaining_time": "14:30:32"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:16:57", "remaining_time": "14:30:29"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:16:59", "remaining_time": "14:30:35"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:18:41", "remaining_time": "14:29:20"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:18:42", "remaining_time": "14:29:22"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:18:40", "remaining_time": "14:29:16"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:22:35", "remaining_time": "14:42:25"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:20:22", "remaining_time": "14:28:00"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:20:21", "remaining_time": "14:27:57"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:20:20", "remaining_time": "14:27:54"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8395, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:24:15", "remaining_time": "14:40:56"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:22:00", "remaining_time": "14:26:32"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:25:53", "remaining_time": "14:39:22"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:21:58", "remaining_time": "14:26:26"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:21:59", "remaining_time": "14:26:29"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:23:35", "remaining_time": "14:24:53"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:23:36", "remaining_time": "14:24:58"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:23:36", "remaining_time": "14:24:56"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:27:29", "remaining_time": "14:37:42"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8272, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:29:08", "remaining_time": "14:36:11"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8272, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:25:15", "remaining_time": "14:23:30"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8272, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:25:14", "remaining_time": "14:23:27"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8272, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:25:15", "remaining_time": "14:23:32"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8336, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:26:52", "remaining_time": "14:22:00"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8336, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:30:45", "remaining_time": "14:34:33"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8336, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:26:51", "remaining_time": "14:21:55"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8336, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:26:52", "remaining_time": "14:21:58"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8264, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:32:22", "remaining_time": "14:32:54"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8264, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:28:29", "remaining_time": "14:20:25"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8264, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:28:28", "remaining_time": "14:20:22"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8264, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:28:29", "remaining_time": "14:20:28"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8381, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:33:59", "remaining_time": "14:31:14"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8381, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:30:04", "remaining_time": "14:18:48"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8381, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:30:06", "remaining_time": "14:18:54"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8381, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:30:05", "remaining_time": "14:18:51"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8278, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:31:42", "remaining_time": "14:17:19"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8278, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:31:40", "remaining_time": "14:17:13"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8278, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:31:41", "remaining_time": "14:17:16"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8278, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:35:35", "remaining_time": "14:29:34"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8458, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:33:17", "remaining_time": "14:15:40"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8458, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:33:18", "remaining_time": "14:15:43"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8458, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:33:16", "remaining_time": "14:15:38"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8458, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:37:11", "remaining_time": "14:27:52"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:38:48", "remaining_time": "14:26:13"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:34:55", "remaining_time": "14:14:10"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:34:53", "remaining_time": "14:14:04"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:34:54", "remaining_time": "14:14:07"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.814, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:40:22", "remaining_time": "14:24:26"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.814, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:36:29", "remaining_time": "14:12:28"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.814, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:36:27", "remaining_time": "14:12:22"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.814, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:36:28", "remaining_time": "14:12:25"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.838, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:41:59", "remaining_time": "14:22:50"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.838, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:38:06", "remaining_time": "14:10:58"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.838, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:38:06", "remaining_time": "14:10:55"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.838, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:38:05", "remaining_time": "14:10:53"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.824, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:39:40", "remaining_time": "14:09:13"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.824, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:39:41", "remaining_time": "14:09:18"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.824, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:43:34", "remaining_time": "14:21:06"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.824, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:39:40", "remaining_time": "14:09:16"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.8314, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:41:17", "remaining_time": "14:07:41"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.8314, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:41:16", "remaining_time": "14:07:38"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.8314, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:41:15", "remaining_time": "14:07:36"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.8314, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:45:09", "remaining_time": "14:19:23"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "4:46:45", "remaining_time": "14:17:42"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "4:42:51", "remaining_time": "14:06:00"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "4:42:52", "remaining_time": "14:06:03"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "4:42:52", "remaining_time": "14:06:05"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "4:44:28", "remaining_time": "14:04:27"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "4:48:21", "remaining_time": "14:15:58"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "4:44:27", "remaining_time": "14:04:25"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "4:44:26", "remaining_time": "14:04:22"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "4:49:58", "remaining_time": "14:14:21"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "4:46:05", "remaining_time": "14:02:54"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "4:46:04", "remaining_time": "14:02:52"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8443, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "4:46:03", "remaining_time": "14:02:49"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8315, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "4:47:41", "remaining_time": "14:01:20"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8315, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "4:47:42", "remaining_time": "14:01:22"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8315, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "4:47:40", "remaining_time": "14:01:17"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8315, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "4:51:35", "remaining_time": "14:12:43"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "4:53:12", "remaining_time": "14:11:06"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "4:49:17", "remaining_time": "13:59:45"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "4:49:19", "remaining_time": "13:59:50"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "4:49:18", "remaining_time": "13:59:47"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8364, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "4:54:49", "remaining_time": "14:09:28"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8364, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "4:50:56", "remaining_time": "13:58:17"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8364, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "4:50:54", "remaining_time": "13:58:12"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8364, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "4:50:55", "remaining_time": "13:58:14"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "4:56:27", "remaining_time": "14:07:54"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "4:52:33", "remaining_time": "13:56:46"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "4:52:34", "remaining_time": "13:56:48"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "4:52:33", "remaining_time": "13:56:43"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8454, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "4:58:05", "remaining_time": "14:06:18"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8454, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "4:54:11", "remaining_time": "13:55:14"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8454, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "4:54:12", "remaining_time": "13:55:16"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8454, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "4:54:10", "remaining_time": "13:55:12"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "4:55:50", "remaining_time": "13:53:47"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "4:59:44", "remaining_time": "14:04:46"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "4:55:51", "remaining_time": "13:53:49"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "4:55:49", "remaining_time": "13:53:44"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8027, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "4:57:27", "remaining_time": "13:52:15"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8027, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "4:57:29", "remaining_time": "13:52:19"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8027, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "4:57:28", "remaining_time": "13:52:17"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8027, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "5:01:22", "remaining_time": "14:03:11"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "4:59:05", "remaining_time": "13:50:43"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "5:02:58", "remaining_time": "14:01:32"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "4:59:04", "remaining_time": "13:50:40"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "4:59:05", "remaining_time": "13:50:45"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.8523, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:04:36", "remaining_time": "13:59:56"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.8523, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:00:43", "remaining_time": "13:49:13"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.8523, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:00:42", "remaining_time": "13:49:11"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.8523, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:00:41", "remaining_time": "13:49:09"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8377, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:06:12", "remaining_time": "13:58:17"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8377, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:02:18", "remaining_time": "13:47:34"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8377, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:02:19", "remaining_time": "13:47:39"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8377, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:02:19", "remaining_time": "13:47:37"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:07:50", "remaining_time": "13:56:41"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:03:57", "remaining_time": "13:46:06"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:03:56", "remaining_time": "13:46:04"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8299, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:03:57", "remaining_time": "13:46:08"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:05:30", "remaining_time": "13:44:23"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:09:24", "remaining_time": "13:54:53"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:05:29", "remaining_time": "13:44:20"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:05:31", "remaining_time": "13:44:25"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:11:04", "remaining_time": "13:53:25"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:07:11", "remaining_time": "13:43:01"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:07:09", "remaining_time": "13:42:56"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:07:10", "remaining_time": "13:42:59"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8262, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:08:46", "remaining_time": "13:41:23"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8262, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:12:40", "remaining_time": "13:51:45"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8262, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:08:46", "remaining_time": "13:41:21"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8262, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:08:47", "remaining_time": "13:41:25"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8258, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:14:15", "remaining_time": "13:50:01"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8258, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:10:22", "remaining_time": "13:39:46"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8258, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:10:20", "remaining_time": "13:39:41"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8258, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:10:21", "remaining_time": "13:39:43"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8248, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:11:57", "remaining_time": "13:38:08"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8248, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:15:51", "remaining_time": "13:48:21"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8248, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:11:56", "remaining_time": "13:38:06"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8248, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:11:58", "remaining_time": "13:38:10"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:13:36", "remaining_time": "13:36:39"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:17:30", "remaining_time": "13:46:47"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:13:35", "remaining_time": "13:36:36"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:13:37", "remaining_time": "13:36:41"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8304, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:19:06", "remaining_time": "13:45:08"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8304, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:15:12", "remaining_time": "13:35:04"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8304, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:15:11", "remaining_time": "13:35:02"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8304, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:15:13", "remaining_time": "13:35:06"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:20:45", "remaining_time": "13:43:37"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:16:52", "remaining_time": "13:33:38"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:16:51", "remaining_time": "13:33:34"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:16:52", "remaining_time": "13:33:36"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8255, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:18:29", "remaining_time": "13:32:03"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8255, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:18:29", "remaining_time": "13:32:05"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8255, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:18:28", "remaining_time": "13:32:00"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8255, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:22:22", "remaining_time": "13:41:59"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:20:08", "remaining_time": "13:30:35"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:24:02", "remaining_time": "13:40:27"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:20:09", "remaining_time": "13:30:37"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:20:07", "remaining_time": "13:30:33"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8331, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:25:39", "remaining_time": "13:38:50"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8331, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:21:46", "remaining_time": "13:29:05"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8331, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:21:44", "remaining_time": "13:29:00"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8331, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:21:45", "remaining_time": "13:29:03"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8309, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:27:17", "remaining_time": "13:37:16"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8309, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:23:24", "remaining_time": "13:27:34"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8309, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:23:23", "remaining_time": "13:27:30"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8309, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:23:24", "remaining_time": "13:27:32"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:25:04", "remaining_time": "13:26:06"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:25:03", "remaining_time": "13:26:04"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:25:04", "remaining_time": "13:26:08"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:28:57", "remaining_time": "13:35:45"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:26:40", "remaining_time": "13:24:29"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:30:33", "remaining_time": "13:34:05"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:26:39", "remaining_time": "13:24:27"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:26:40", "remaining_time": "13:24:31"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:32:06", "remaining_time": "13:32:17"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:28:11", "remaining_time": "13:22:43"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:28:13", "remaining_time": "13:22:47"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:28:12", "remaining_time": "13:22:45"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:29:52", "remaining_time": "13:21:18"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:33:46", "remaining_time": "13:30:45"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:29:51", "remaining_time": "13:21:15"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:29:53", "remaining_time": "13:21:19"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:31:27", "remaining_time": "13:19:38"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:31:27", "remaining_time": "13:19:40"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:35:20", "remaining_time": "13:29:02"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.8273, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:31:26", "remaining_time": "13:19:36"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:36:56", "remaining_time": "13:27:21"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:33:03", "remaining_time": "13:18:03"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:33:02", "remaining_time": "13:18:01"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:33:01", "remaining_time": "13:17:59"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8374, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:38:31", "remaining_time": "13:25:39"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8374, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:34:38", "remaining_time": "13:16:25"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8374, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:34:37", "remaining_time": "13:16:21"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8374, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:34:38", "remaining_time": "13:16:23"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8173, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:36:16", "remaining_time": "13:14:54"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8173, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:40:10", "remaining_time": "13:24:06"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8173, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:36:15", "remaining_time": "13:14:52"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8173, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:36:17", "remaining_time": "13:14:56"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8227, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:37:59", "remaining_time": "13:13:32"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8227, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:41:52", "remaining_time": "13:22:41"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8227, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:37:59", "remaining_time": "13:13:34"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8227, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:37:58", "remaining_time": "13:13:30"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:39:36", "remaining_time": "13:11:59"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:39:35", "remaining_time": "13:11:56"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:39:37", "remaining_time": "13:12:00"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:43:29", "remaining_time": "13:21:04"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8226, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "5:45:10", "remaining_time": "13:19:33"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8226, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "5:41:15", "remaining_time": "13:10:30"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8226, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "5:41:17", "remaining_time": "13:10:34"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8226, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "5:41:16", "remaining_time": "13:10:32"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.815, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "5:46:47", "remaining_time": "13:17:55"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.815, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "5:42:52", "remaining_time": "13:08:55"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.815, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "5:42:54", "remaining_time": "13:08:59"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.815, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "5:42:53", "remaining_time": "13:08:58"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "5:44:29", "remaining_time": "13:07:20"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "5:44:29", "remaining_time": "13:07:22"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "5:44:28", "remaining_time": "13:07:18"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "5:48:22", "remaining_time": "13:16:14"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "5:50:04", "remaining_time": "13:14:47"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "5:46:09", "remaining_time": "13:05:55"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "5:46:10", "remaining_time": "13:05:57"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "5:46:11", "remaining_time": "13:05:59"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "5:47:44", "remaining_time": "13:04:16"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "5:47:43", "remaining_time": "13:04:14"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "5:47:45", "remaining_time": "13:04:17"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "5:51:38", "remaining_time": "13:13:03"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "5:49:16", "remaining_time": "13:02:29"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "5:53:10", "remaining_time": "13:11:13"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "5:49:15", "remaining_time": "13:02:27"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "5:49:17", "remaining_time": "13:02:31"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "5:50:50", "remaining_time": "13:00:50"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "5:50:51", "remaining_time": "13:00:52"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "5:50:50", "remaining_time": "13:00:48"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "5:54:44", "remaining_time": "13:09:30"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "5:52:29", "remaining_time": "12:59:19"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "5:56:23", "remaining_time": "13:07:56"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "5:52:28", "remaining_time": "12:59:17"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "5:52:30", "remaining_time": "12:59:21"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8308, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "5:54:05", "remaining_time": "12:57:43"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8308, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "5:54:06", "remaining_time": "12:57:44"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8308, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "5:54:04", "remaining_time": "12:57:41"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8308, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "5:57:59", "remaining_time": "13:06:16"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8187, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "5:59:41", "remaining_time": "13:04:49"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8187, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "5:55:46", "remaining_time": "12:56:17"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8187, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "5:55:48", "remaining_time": "12:56:21"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8187, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "5:55:47", "remaining_time": "12:56:19"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8274, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "5:57:26", "remaining_time": "12:54:50"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8274, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "6:01:20", "remaining_time": "13:03:17"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8274, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "5:57:27", "remaining_time": "12:54:52"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8274, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "5:57:26", "remaining_time": "12:54:48"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "6:02:55", "remaining_time": "13:01:35"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "5:59:01", "remaining_time": "12:53:10"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "5:59:02", "remaining_time": "12:53:13"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "5:59:02", "remaining_time": "12:53:12"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8213, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:00:41", "remaining_time": "12:51:42"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8213, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:04:34", "remaining_time": "13:00:02"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8213, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:00:40", "remaining_time": "12:51:40"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8213, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:00:42", "remaining_time": "12:51:44"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:06:14", "remaining_time": "12:58:29"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:02:20", "remaining_time": "12:50:13"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:02:19", "remaining_time": "12:50:11"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:02:21", "remaining_time": "12:50:14"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8296, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:07:48", "remaining_time": "12:56:46"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8296, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:03:54", "remaining_time": "12:48:31"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8296, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:03:55", "remaining_time": "12:48:34"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8296, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:03:54", "remaining_time": "12:48:33"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8247, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:05:34", "remaining_time": "12:47:04"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8247, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:09:28", "remaining_time": "12:55:14"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8247, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:05:33", "remaining_time": "12:47:02"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8247, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:05:35", "remaining_time": "12:47:06"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:07:12", "remaining_time": "12:45:31"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:07:13", "remaining_time": "12:45:33"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:07:11", "remaining_time": "12:45:30"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:11:06", "remaining_time": "12:53:39"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:08:47", "remaining_time": "12:43:53"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:12:41", "remaining_time": "12:51:57"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:08:48", "remaining_time": "12:43:54"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:08:46", "remaining_time": "12:43:51"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:14:20", "remaining_time": "12:50:23"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:10:26", "remaining_time": "12:42:23"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:10:25", "remaining_time": "12:42:21"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:10:27", "remaining_time": "12:42:24"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8198, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:12:04", "remaining_time": "12:40:49"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8198, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:12:04", "remaining_time": "12:40:50"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8198, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:12:03", "remaining_time": "12:40:47"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8198, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:15:57", "remaining_time": "12:48:46"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:17:36", "remaining_time": "12:47:12"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:13:43", "remaining_time": "12:39:19"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:13:41", "remaining_time": "12:39:15"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:13:42", "remaining_time": "12:39:17"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.8185, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:19:13", "remaining_time": "12:45:35"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.8185, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:15:19", "remaining_time": "12:37:43"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.8185, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:15:19", "remaining_time": "12:37:41"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.8185, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:15:20", "remaining_time": "12:37:44"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:20:48", "remaining_time": "12:43:52"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:16:55", "remaining_time": "12:36:05"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:16:53", "remaining_time": "12:36:02"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:16:54", "remaining_time": "12:36:04"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:18:31", "remaining_time": "12:34:29"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:22:25", "remaining_time": "12:42:15"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:18:31", "remaining_time": "12:34:28"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:18:32", "remaining_time": "12:34:31"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:24:03", "remaining_time": "12:40:38"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:20:09", "remaining_time": "12:32:55"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:20:08", "remaining_time": "12:32:54"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:20:10", "remaining_time": "12:32:57"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:21:47", "remaining_time": "12:31:23"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:25:41", "remaining_time": "12:39:03"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:21:48", "remaining_time": "12:31:25"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:21:46", "remaining_time": "12:31:22"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:23:23", "remaining_time": "12:29:46"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:27:17", "remaining_time": "12:37:24"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:23:22", "remaining_time": "12:29:45"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:23:24", "remaining_time": "12:29:48"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:24:59", "remaining_time": "12:28:10"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:28:53", "remaining_time": "12:35:45"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:24:59", "remaining_time": "12:28:09"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:25:00", "remaining_time": "12:28:12"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:30:32", "remaining_time": "12:34:11"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:26:37", "remaining_time": "12:26:38"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:26:39", "remaining_time": "12:26:41"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:26:38", "remaining_time": "12:26:39"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.8079, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:32:09", "remaining_time": "12:32:33"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.8079, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:28:16", "remaining_time": "12:25:05"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.8079, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:28:16", "remaining_time": "12:25:06"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.8079, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:28:15", "remaining_time": "12:25:03"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:29:55", "remaining_time": "12:23:35"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:29:56", "remaining_time": "12:23:37"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:29:54", "remaining_time": "12:23:34"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.821, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:33:49", "remaining_time": "12:31:01"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:31:36", "remaining_time": "12:22:08"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:31:36", "remaining_time": "12:22:07"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:31:35", "remaining_time": "12:22:05"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:35:29", "remaining_time": "12:29:29"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:33:13", "remaining_time": "12:20:33"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:33:13", "remaining_time": "12:20:31"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:33:14", "remaining_time": "12:20:35"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:37:07", "remaining_time": "12:27:53"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8112, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:34:49", "remaining_time": "12:18:56"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8112, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:38:43", "remaining_time": "12:26:13"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8112, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:34:48", "remaining_time": "12:18:54"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8112, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:34:50", "remaining_time": "12:18:58"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8099, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:40:16", "remaining_time": "12:24:29"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8099, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:36:23", "remaining_time": "12:17:14"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8099, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:36:23", "remaining_time": "12:17:16"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8099, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:36:22", "remaining_time": "12:17:13"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "6:41:57", "remaining_time": "12:22:59"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "6:38:04", "remaining_time": "12:15:48"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "6:38:03", "remaining_time": "12:15:45"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "6:38:04", "remaining_time": "12:15:47"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8105, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "6:39:40", "remaining_time": "12:14:11"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8105, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "6:39:39", "remaining_time": "12:14:09"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8105, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "6:39:41", "remaining_time": "12:14:12"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8105, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "6:43:34", "remaining_time": "12:21:20"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8132, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "6:41:14", "remaining_time": "12:12:30"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8132, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "6:41:13", "remaining_time": "12:12:28"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8132, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "6:41:15", "remaining_time": "12:12:31"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8132, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "6:45:08", "remaining_time": "12:19:36"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8149, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "6:42:53", "remaining_time": "12:10:59"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8149, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "6:46:47", "remaining_time": "12:18:03"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8149, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "6:42:54", "remaining_time": "12:11:00"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8149, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "6:42:52", "remaining_time": "12:10:57"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "6:48:24", "remaining_time": "12:16:26"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "6:44:31", "remaining_time": "12:09:26"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "6:44:30", "remaining_time": "12:09:24"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8306, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "6:44:30", "remaining_time": "12:09:23"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "6:49:58", "remaining_time": "12:14:43"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "6:46:05", "remaining_time": "12:07:45"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "6:46:04", "remaining_time": "12:07:42"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "6:46:05", "remaining_time": "12:07:44"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "6:47:40", "remaining_time": "12:06:06"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "6:51:34", "remaining_time": "12:13:02"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "6:47:39", "remaining_time": "12:06:05"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "6:47:41", "remaining_time": "12:06:08"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "6:53:08", "remaining_time": "12:11:21"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "6:49:15", "remaining_time": "12:04:28"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "6:49:14", "remaining_time": "12:04:25"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "6:49:15", "remaining_time": "12:04:27"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "6:50:54", "remaining_time": "12:02:56"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "6:54:48", "remaining_time": "12:09:47"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "6:50:55", "remaining_time": "12:02:57"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "6:50:53", "remaining_time": "12:02:54"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "6:52:31", "remaining_time": "12:01:21"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "6:56:25", "remaining_time": "12:08:10"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "6:52:30", "remaining_time": "12:01:20"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "6:52:32", "remaining_time": "12:01:23"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8109, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "6:58:02", "remaining_time": "12:06:33"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8109, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "6:54:09", "remaining_time": "11:59:47"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8109, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "6:54:08", "remaining_time": "11:59:45"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8109, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "6:54:09", "remaining_time": "11:59:48"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "6:55:44", "remaining_time": "11:58:09"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "6:55:45", "remaining_time": "11:58:10"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "6:55:43", "remaining_time": "11:58:07"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "6:59:38", "remaining_time": "12:04:52"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "7:01:15", "remaining_time": "12:03:15"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "6:57:22", "remaining_time": "11:56:35"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "6:57:20", "remaining_time": "11:56:32"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8275, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "6:57:21", "remaining_time": "11:56:34"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "7:02:52", "remaining_time": "12:01:39"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "6:58:58", "remaining_time": "11:54:58"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "6:58:59", "remaining_time": "11:55:01"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "6:58:59", "remaining_time": "11:55:00"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:00:38", "remaining_time": "11:53:29"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:00:39", "remaining_time": "11:53:30"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:00:37", "remaining_time": "11:53:27"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:04:32", "remaining_time": "12:00:05"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:02:19", "remaining_time": "11:51:59"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:06:12", "remaining_time": "11:58:33"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:02:18", "remaining_time": "11:51:58"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:02:19", "remaining_time": "11:52:01"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:03:53", "remaining_time": "11:50:20"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:03:54", "remaining_time": "11:50:21"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:07:47", "remaining_time": "11:56:51"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8241, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:03:52", "remaining_time": "11:50:18"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:09:24", "remaining_time": "11:55:15"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:05:31", "remaining_time": "11:48:47"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:05:30", "remaining_time": "11:48:44"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:05:31", "remaining_time": "11:48:46"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8161, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:07:05", "remaining_time": "11:47:06"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8161, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:07:06", "remaining_time": "11:47:07"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8161, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:07:04", "remaining_time": "11:47:05"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8161, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:10:59", "remaining_time": "11:53:33"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:08:41", "remaining_time": "11:45:29"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:12:35", "remaining_time": "11:51:54"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:08:42", "remaining_time": "11:45:31"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:08:40", "remaining_time": "11:45:28"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:10:15", "remaining_time": "11:43:49"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:10:14", "remaining_time": "11:43:47"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:10:16", "remaining_time": "11:43:50"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:14:09", "remaining_time": "11:50:11"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:11:51", "remaining_time": "11:42:12"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:15:45", "remaining_time": "11:48:32"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:11:50", "remaining_time": "11:42:11"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:11:52", "remaining_time": "11:42:14"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8153, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:13:30", "remaining_time": "11:40:40"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8153, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:13:29", "remaining_time": "11:40:38"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8153, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:17:23", "remaining_time": "11:46:57"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8153, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:13:30", "remaining_time": "11:40:41"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:19:02", "remaining_time": "11:45:22"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:15:09", "remaining_time": "11:39:08"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:15:07", "remaining_time": "11:39:05"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:15:08", "remaining_time": "11:39:07"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8138, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:20:39", "remaining_time": "11:43:45"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8138, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:16:46", "remaining_time": "11:37:33"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8138, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:16:44", "remaining_time": "11:37:30"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8138, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:16:45", "remaining_time": "11:37:32"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:18:24", "remaining_time": "11:35:59"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:18:23", "remaining_time": "11:35:58"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:18:25", "remaining_time": "11:36:01"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8178, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:22:18", "remaining_time": "11:42:10"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8062, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:23:53", "remaining_time": "11:40:30"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8062, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:20:00", "remaining_time": "11:34:22"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8062, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:19:58", "remaining_time": "11:34:20"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8062, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:19:59", "remaining_time": "11:34:21"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:21:36", "remaining_time": "11:32:45"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:21:35", "remaining_time": "11:32:44"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:21:37", "remaining_time": "11:32:47"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:25:30", "remaining_time": "11:38:52"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.7982, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:23:09", "remaining_time": "11:31:04"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.7982, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:27:02", "remaining_time": "11:37:08"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.7982, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:23:08", "remaining_time": "11:31:02"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.7982, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:23:09", "remaining_time": "11:31:03"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:28:41", "remaining_time": "11:35:33"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:24:47", "remaining_time": "11:29:29"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:24:48", "remaining_time": "11:29:32"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8021, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:24:48", "remaining_time": "11:29:31"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:30:20", "remaining_time": "11:33:58"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:26:26", "remaining_time": "11:27:58"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:26:25", "remaining_time": "11:27:57"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:26:27", "remaining_time": "11:27:59"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:28:05", "remaining_time": "11:26:26"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:28:06", "remaining_time": "11:26:27"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:31:59", "remaining_time": "11:32:24"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:28:04", "remaining_time": "11:26:24"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:33:36", "remaining_time": "11:30:46"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:29:43", "remaining_time": "11:24:51"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:29:42", "remaining_time": "11:24:50"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8047, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:29:41", "remaining_time": "11:24:49"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:35:14", "remaining_time": "11:29:10"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:31:21", "remaining_time": "11:23:17"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:31:19", "remaining_time": "11:23:14"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:31:20", "remaining_time": "11:23:16"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:36:52", "remaining_time": "11:27:34"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:32:58", "remaining_time": "11:21:42"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:32:57", "remaining_time": "11:21:41"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:32:59", "remaining_time": "11:21:43"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8139, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "7:34:34", "remaining_time": "11:20:06"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8139, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "7:38:28", "remaining_time": "11:25:55"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8139, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "7:34:33", "remaining_time": "11:20:04"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8139, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "7:34:35", "remaining_time": "11:20:07"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.8075, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "7:36:12", "remaining_time": "11:18:31"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.8075, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "7:36:13", "remaining_time": "11:18:32"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.8075, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "7:36:11", "remaining_time": "11:18:30"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.8075, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "7:40:06", "remaining_time": "11:24:19"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "7:37:47", "remaining_time": "11:16:53"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "7:37:48", "remaining_time": "11:16:54"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "7:37:49", "remaining_time": "11:16:56"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "7:41:42", "remaining_time": "11:22:40"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "7:39:28", "remaining_time": "11:15:23"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "7:39:28", "remaining_time": "11:15:24"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "7:39:27", "remaining_time": "11:15:21"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8242, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "7:43:21", "remaining_time": "11:21:06"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "7:45:01", "remaining_time": "11:19:33"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "7:41:07", "remaining_time": "11:13:50"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "7:41:08", "remaining_time": "11:13:52"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "7:41:07", "remaining_time": "11:13:51"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8088, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "7:46:38", "remaining_time": "11:17:56"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8088, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "7:42:45", "remaining_time": "11:12:16"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8088, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "7:42:46", "remaining_time": "11:12:17"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8088, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "7:42:44", "remaining_time": "11:12:15"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "7:44:26", "remaining_time": "11:10:47"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "7:48:20", "remaining_time": "11:16:25"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "7:44:27", "remaining_time": "11:10:48"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "7:44:25", "remaining_time": "11:10:46"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "7:50:00", "remaining_time": "11:14:52"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "7:46:07", "remaining_time": "11:09:16"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "7:46:06", "remaining_time": "11:09:15"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "7:46:07", "remaining_time": "11:09:18"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "7:47:44", "remaining_time": "11:07:42"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "7:47:43", "remaining_time": "11:07:40"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "7:47:45", "remaining_time": "11:07:43"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "7:51:38", "remaining_time": "11:13:15"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "7:53:15", "remaining_time": "11:11:38"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "7:49:22", "remaining_time": "11:06:06"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "7:49:21", "remaining_time": "11:06:05"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "7:49:22", "remaining_time": "11:06:08"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "7:51:00", "remaining_time": "11:04:32"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "7:50:58", "remaining_time": "11:04:30"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "7:54:53", "remaining_time": "11:10:01"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "7:50:59", "remaining_time": "11:04:31"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8131, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "7:52:38", "remaining_time": "11:02:59"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8131, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "7:52:39", "remaining_time": "11:03:00"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8131, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "7:52:37", "remaining_time": "11:02:58"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8131, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "7:56:32", "remaining_time": "11:08:27"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "7:54:17", "remaining_time": "11:01:26"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "7:54:16", "remaining_time": "11:01:24"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "7:58:11", "remaining_time": "11:06:52"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "7:54:18", "remaining_time": "11:01:27"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "7:55:58", "remaining_time": "10:59:56"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "7:59:52", "remaining_time": "11:05:20"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "7:55:57", "remaining_time": "10:59:55"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "7:55:59", "remaining_time": "10:59:57"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.7986, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "7:57:37", "remaining_time": "10:58:23"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.7986, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "7:57:38", "remaining_time": "10:58:24"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.7986, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "7:57:36", "remaining_time": "10:58:21"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.7986, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "8:01:31", "remaining_time": "11:03:45"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "8:03:10", "remaining_time": "11:02:10"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "7:59:16", "remaining_time": "10:56:49"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "7:59:15", "remaining_time": "10:56:48"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "7:59:17", "remaining_time": "10:56:50"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:00:54", "remaining_time": "10:55:15"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:00:55", "remaining_time": "10:55:16"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:00:53", "remaining_time": "10:55:14"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:04:48", "remaining_time": "11:00:34"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:02:35", "remaining_time": "10:53:45"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:06:28", "remaining_time": "10:59:00"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:02:34", "remaining_time": "10:53:43"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:02:34", "remaining_time": "10:53:44"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8081, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:04:09", "remaining_time": "10:52:05"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8081, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:08:02", "remaining_time": "10:57:19"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8081, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:04:08", "remaining_time": "10:52:03"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8081, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:04:09", "remaining_time": "10:52:04"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:09:37", "remaining_time": "10:55:38"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:05:43", "remaining_time": "10:50:25"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:05:42", "remaining_time": "10:50:24"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:05:44", "remaining_time": "10:50:26"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8152, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:11:12", "remaining_time": "10:53:57"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8152, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:07:17", "remaining_time": "10:48:45"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8152, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:07:19", "remaining_time": "10:48:47"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8152, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:07:18", "remaining_time": "10:48:46"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.8091, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:08:53", "remaining_time": "10:47:08"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.8091, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:12:47", "remaining_time": "10:52:17"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.8091, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:08:52", "remaining_time": "10:47:07"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.8091, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:08:54", "remaining_time": "10:47:09"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8206, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:10:28", "remaining_time": "10:45:29"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8206, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:10:29", "remaining_time": "10:45:30"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8206, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:10:27", "remaining_time": "10:45:28"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8206, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:14:22", "remaining_time": "10:50:37"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:12:08", "remaining_time": "10:43:58"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:16:02", "remaining_time": "10:49:03"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:12:09", "remaining_time": "10:43:59"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:12:07", "remaining_time": "10:43:56"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:13:47", "remaining_time": "10:42:24"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:17:41", "remaining_time": "10:47:28"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:13:48", "remaining_time": "10:42:25"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:13:46", "remaining_time": "10:42:23"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8135, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:19:19", "remaining_time": "10:45:52"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8135, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:15:26", "remaining_time": "10:40:51"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8135, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:15:24", "remaining_time": "10:40:49"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8135, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:15:25", "remaining_time": "10:40:50"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:17:02", "remaining_time": "10:39:14"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:17:01", "remaining_time": "10:39:12"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:17:03", "remaining_time": "10:39:15"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:20:56", "remaining_time": "10:44:14"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:22:32", "remaining_time": "10:42:36"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:18:38", "remaining_time": "10:37:36"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:18:39", "remaining_time": "10:37:37"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:18:39", "remaining_time": "10:37:38"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:20:18", "remaining_time": "10:36:05"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:24:12", "remaining_time": "10:41:02"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:20:19", "remaining_time": "10:36:06"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:20:17", "remaining_time": "10:36:04"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:21:54", "remaining_time": "10:34:27"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:25:49", "remaining_time": "10:39:24"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:21:56", "remaining_time": "10:34:29"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:21:55", "remaining_time": "10:34:28"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:23:33", "remaining_time": "10:32:54"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:27:26", "remaining_time": "10:37:46"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:23:31", "remaining_time": "10:32:52"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.8032, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:23:32", "remaining_time": "10:32:53"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:25:11", "remaining_time": "10:31:19"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:25:09", "remaining_time": "10:31:17"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:25:10", "remaining_time": "10:31:18"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:29:03", "remaining_time": "10:36:10"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:26:46", "remaining_time": "10:29:41"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:30:40", "remaining_time": "10:34:32"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:26:47", "remaining_time": "10:29:42"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:26:46", "remaining_time": "10:29:40"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:28:25", "remaining_time": "10:28:08"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:32:19", "remaining_time": "10:32:56"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:28:24", "remaining_time": "10:28:07"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:28:26", "remaining_time": "10:28:09"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:30:03", "remaining_time": "10:26:33"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:30:02", "remaining_time": "10:26:32"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:30:04", "remaining_time": "10:26:34"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:33:57", "remaining_time": "10:31:20"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "8:35:38", "remaining_time": "10:29:47"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "8:31:44", "remaining_time": "10:25:02"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "8:31:45", "remaining_time": "10:25:03"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "8:31:43", "remaining_time": "10:25:01"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "8:33:22", "remaining_time": "10:23:26"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "8:37:15", "remaining_time": "10:28:10"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "8:33:23", "remaining_time": "10:23:27"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "8:33:21", "remaining_time": "10:23:25"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "8:34:56", "remaining_time": "10:21:47"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "8:38:49", "remaining_time": "10:26:29"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "8:34:55", "remaining_time": "10:21:45"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "8:34:56", "remaining_time": "10:21:46"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "8:40:27", "remaining_time": "10:24:52"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "8:36:33", "remaining_time": "10:20:11"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "8:36:32", "remaining_time": "10:20:10"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "8:36:34", "remaining_time": "10:20:12"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "8:38:12", "remaining_time": "10:18:37"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "8:38:11", "remaining_time": "10:18:36"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "8:38:12", "remaining_time": "10:18:38"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "8:42:05", "remaining_time": "10:23:16"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "8:39:48", "remaining_time": "10:17:00"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "8:39:49", "remaining_time": "10:17:01"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "8:39:50", "remaining_time": "10:17:02"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "8:43:43", "remaining_time": "10:21:39"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8006, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "8:41:27", "remaining_time": "10:15:26"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8006, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "8:41:27", "remaining_time": "10:15:27"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8006, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "8:45:20", "remaining_time": "10:20:02"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8006, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "8:41:26", "remaining_time": "10:15:25"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "8:46:59", "remaining_time": "10:18:26"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "8:43:06", "remaining_time": "10:13:52"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "8:43:05", "remaining_time": "10:13:51"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "8:43:06", "remaining_time": "10:13:53"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "8:44:46", "remaining_time": "10:12:20"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "8:44:47", "remaining_time": "10:12:21"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "8:44:45", "remaining_time": "10:12:19"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "8:48:39", "remaining_time": "10:16:53"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "8:50:19", "remaining_time": "10:15:18"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "8:46:25", "remaining_time": "10:10:47"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "8:46:26", "remaining_time": "10:10:48"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "8:46:25", "remaining_time": "10:10:46"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "8:51:58", "remaining_time": "10:13:43"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "8:48:04", "remaining_time": "10:09:12"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "8:48:05", "remaining_time": "10:09:14"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "8:48:05", "remaining_time": "10:09:13"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "8:53:35", "remaining_time": "10:12:05"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "8:49:40", "remaining_time": "10:07:36"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "8:49:42", "remaining_time": "10:07:38"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.811, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "8:49:41", "remaining_time": "10:07:37"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "8:55:15", "remaining_time": "10:10:30"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "8:51:21", "remaining_time": "10:06:04"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "8:51:20", "remaining_time": "10:06:03"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "8:51:22", "remaining_time": "10:06:04"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "8:56:50", "remaining_time": "10:08:51"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "8:52:57", "remaining_time": "10:04:27"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "8:52:56", "remaining_time": "10:04:25"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "8:52:57", "remaining_time": "10:04:26"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.7991, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "8:58:31", "remaining_time": "10:07:17"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.7991, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "8:54:37", "remaining_time": "10:02:54"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.7991, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "8:54:38", "remaining_time": "10:02:55"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.7991, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "8:54:36", "remaining_time": "10:02:53"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "8:56:11", "remaining_time": "10:01:14"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "9:00:05", "remaining_time": "10:05:36"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "8:56:12", "remaining_time": "10:01:15"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "8:56:10", "remaining_time": "10:01:13"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8156, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "8:57:52", "remaining_time": "9:59:42"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8156, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "9:01:45", "remaining_time": "10:04:02"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8156, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "8:57:50", "remaining_time": "9:59:40"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8156, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "8:57:51", "remaining_time": "9:59:41"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "8:59:28", "remaining_time": "9:58:05"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "9:03:22", "remaining_time": "10:02:24"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "8:59:27", "remaining_time": "9:58:04"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "8:59:29", "remaining_time": "9:58:06"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:01:08", "remaining_time": "9:56:32"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:01:07", "remaining_time": "9:56:31"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:01:06", "remaining_time": "9:56:30"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:05:00", "remaining_time": "10:00:48"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:06:39", "remaining_time": "9:59:13"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:02:47", "remaining_time": "9:54:58"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:02:45", "remaining_time": "9:54:56"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:02:46", "remaining_time": "9:54:57"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:08:18", "remaining_time": "9:57:37"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:04:24", "remaining_time": "9:53:22"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:04:25", "remaining_time": "9:53:23"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:04:23", "remaining_time": "9:53:21"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8124, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:06:03", "remaining_time": "9:51:48"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8124, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:09:56", "remaining_time": "9:56:00"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8124, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:06:02", "remaining_time": "9:51:47"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8124, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:06:01", "remaining_time": "9:51:46"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:07:38", "remaining_time": "9:50:09"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:07:39", "remaining_time": "9:50:10"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:07:37", "remaining_time": "9:50:08"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:11:32", "remaining_time": "9:54:21"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.7979, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:13:08", "remaining_time": "9:52:42"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.7979, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:09:15", "remaining_time": "9:48:33"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.7979, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:09:13", "remaining_time": "9:48:31"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.7979, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:09:14", "remaining_time": "9:48:32"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:10:51", "remaining_time": "9:46:56"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:10:50", "remaining_time": "9:46:55"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:10:49", "remaining_time": "9:46:54"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:14:44", "remaining_time": "9:51:04"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:12:26", "remaining_time": "9:45:18"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:16:20", "remaining_time": "9:49:25"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:12:27", "remaining_time": "9:45:18"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8046, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:12:25", "remaining_time": "9:45:17"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:14:03", "remaining_time": "9:43:41"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:14:04", "remaining_time": "9:43:42"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:14:02", "remaining_time": "9:43:40"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.8082, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:17:56", "remaining_time": "9:47:47"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:15:41", "remaining_time": "9:42:06"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:19:34", "remaining_time": "9:46:10"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:15:42", "remaining_time": "9:42:06"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:15:40", "remaining_time": "9:42:05"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:21:11", "remaining_time": "9:44:33"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:17:18", "remaining_time": "9:40:30"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:17:17", "remaining_time": "9:40:28"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:17:17", "remaining_time": "9:40:29"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:22:45", "remaining_time": "9:42:52"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:18:51", "remaining_time": "9:38:49"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:18:52", "remaining_time": "9:38:51"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:18:52", "remaining_time": "9:38:50"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:24:25", "remaining_time": "9:41:17"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:20:31", "remaining_time": "9:37:16"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:20:32", "remaining_time": "9:37:17"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:20:31", "remaining_time": "9:37:17"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:26:06", "remaining_time": "9:39:43"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:22:13", "remaining_time": "9:35:45"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:22:11", "remaining_time": "9:35:43"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:22:12", "remaining_time": "9:35:44"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:23:50", "remaining_time": "9:34:09"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:27:44", "remaining_time": "9:38:07"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:23:49", "remaining_time": "9:34:08"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:23:51", "remaining_time": "9:34:10"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:25:31", "remaining_time": "9:32:36"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:25:32", "remaining_time": "9:32:37"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:25:30", "remaining_time": "9:32:35"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:29:25", "remaining_time": "9:36:33"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.8011, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:27:09", "remaining_time": "9:31:01"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.8011, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:27:10", "remaining_time": "9:31:02"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.8011, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:27:11", "remaining_time": "9:31:03"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.8011, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:31:03", "remaining_time": "9:34:57"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "9:32:40", "remaining_time": "9:33:19"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "9:28:47", "remaining_time": "9:29:25"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "9:28:46", "remaining_time": "9:29:24"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "9:28:47", "remaining_time": "9:29:26"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "9:30:25", "remaining_time": "9:27:50"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "9:30:24", "remaining_time": "9:27:49"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "9:30:23", "remaining_time": "9:27:49"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "9:34:18", "remaining_time": "9:31:42"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "9:31:59", "remaining_time": "9:26:11"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "9:31:58", "remaining_time": "9:26:10"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "9:31:57", "remaining_time": "9:26:09"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8125, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "9:35:52", "remaining_time": "9:30:01"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "9:33:35", "remaining_time": "9:24:34"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "9:37:29", "remaining_time": "9:28:24"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "9:33:36", "remaining_time": "9:24:34"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "9:33:34", "remaining_time": "9:24:33"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "9:39:08", "remaining_time": "9:26:48"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "9:35:14", "remaining_time": "9:22:59"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "9:35:13", "remaining_time": "9:22:58"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "9:35:15", "remaining_time": "9:23:00"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "9:36:51", "remaining_time": "9:21:23"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "9:40:45", "remaining_time": "9:25:10"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "9:36:52", "remaining_time": "9:21:24"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8056, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "9:36:50", "remaining_time": "9:21:22"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "9:42:24", "remaining_time": "9:23:35"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "9:38:31", "remaining_time": "9:19:49"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "9:38:30", "remaining_time": "9:19:49"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "9:38:29", "remaining_time": "9:19:48"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "9:40:08", "remaining_time": "9:18:13"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "9:40:07", "remaining_time": "9:18:12"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "9:40:06", "remaining_time": "9:18:12"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "9:44:01", "remaining_time": "9:21:57"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "9:41:46", "remaining_time": "9:16:37"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "9:41:45", "remaining_time": "9:16:36"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "9:45:38", "remaining_time": "9:20:20"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "9:41:44", "remaining_time": "9:16:36"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "9:43:22", "remaining_time": "9:15:00"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "9:47:16", "remaining_time": "9:18:42"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "9:43:21", "remaining_time": "9:14:59"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "9:43:23", "remaining_time": "9:15:01"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "9:48:54", "remaining_time": "9:17:06"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "9:45:00", "remaining_time": "9:13:25"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "9:44:59", "remaining_time": "9:13:24"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "9:45:01", "remaining_time": "9:13:25"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8028, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "9:50:29", "remaining_time": "9:15:26"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8028, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "9:46:34", "remaining_time": "9:11:46"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8028, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "9:46:36", "remaining_time": "9:11:47"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8028, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "9:46:35", "remaining_time": "9:11:47"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.7974, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "9:48:10", "remaining_time": "9:10:08"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.7974, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "9:48:11", "remaining_time": "9:10:09"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.7974, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "9:48:09", "remaining_time": "9:10:07"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.7974, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "9:52:03", "remaining_time": "9:13:47"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "9:49:47", "remaining_time": "9:08:32"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "9:49:46", "remaining_time": "9:08:31"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "9:53:40", "remaining_time": "9:12:08"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "9:49:45", "remaining_time": "9:08:30"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8002, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "9:55:15", "remaining_time": "9:10:29"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8002, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "9:51:22", "remaining_time": "9:06:54"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8002, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "9:51:20", "remaining_time": "9:06:52"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8002, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "9:51:21", "remaining_time": "9:06:53"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8095, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "9:52:59", "remaining_time": "9:05:17"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8095, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "9:56:53", "remaining_time": "9:08:52"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8095, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "9:53:00", "remaining_time": "9:05:18"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8095, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "9:52:58", "remaining_time": "9:05:16"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "9:58:29", "remaining_time": "9:07:14"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "9:54:36", "remaining_time": "9:03:41"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "9:54:35", "remaining_time": "9:03:40"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "9:54:34", "remaining_time": "9:03:39"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7693, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "10:00:07", "remaining_time": "9:05:37"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7693, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "9:56:14", "remaining_time": "9:02:05"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7693, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "9:56:12", "remaining_time": "9:02:03"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7693, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "9:56:13", "remaining_time": "9:02:04"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8078, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "9:57:50", "remaining_time": "9:00:28"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8078, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "9:57:51", "remaining_time": "9:00:28"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8078, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "9:57:49", "remaining_time": "9:00:27"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8078, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "10:01:43", "remaining_time": "9:03:59"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "10:03:21", "remaining_time": "9:02:22"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "9:59:28", "remaining_time": "8:58:52"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "9:59:26", "remaining_time": "8:58:51"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "9:59:27", "remaining_time": "8:58:52"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.77, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:01:04", "remaining_time": "8:57:16"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.77, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:04:57", "remaining_time": "9:00:44"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.77, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:01:04", "remaining_time": "8:57:15"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.77, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:01:03", "remaining_time": "8:57:14"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:02:43", "remaining_time": "8:55:41"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:06:37", "remaining_time": "8:59:08"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:02:42", "remaining_time": "8:55:40"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:02:44", "remaining_time": "8:55:41"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:04:25", "remaining_time": "8:54:09"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:08:18", "remaining_time": "8:57:34"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:04:24", "remaining_time": "8:54:08"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:04:23", "remaining_time": "8:54:07"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:06:00", "remaining_time": "8:52:30"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:09:53", "remaining_time": "8:55:55"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:05:58", "remaining_time": "8:52:29"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:05:59", "remaining_time": "8:52:30"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:07:39", "remaining_time": "8:50:56"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:11:33", "remaining_time": "8:54:20"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:07:38", "remaining_time": "8:50:55"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:07:40", "remaining_time": "8:50:57"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8022, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:09:18", "remaining_time": "8:49:21"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8022, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:09:17", "remaining_time": "8:49:20"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8022, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:13:11", "remaining_time": "8:52:43"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8022, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:09:16", "remaining_time": "8:49:19"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:10:52", "remaining_time": "8:47:42"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:14:46", "remaining_time": "8:51:04"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:10:51", "remaining_time": "8:47:41"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:10:53", "remaining_time": "8:47:43"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.7975, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:16:24", "remaining_time": "8:49:27"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.7975, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:12:29", "remaining_time": "8:46:06"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.7975, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:12:31", "remaining_time": "8:46:07"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.7975, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:12:30", "remaining_time": "8:46:07"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:14:03", "remaining_time": "8:44:26"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:17:56", "remaining_time": "8:47:46"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:14:03", "remaining_time": "8:44:27"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:14:02", "remaining_time": "8:44:25"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:15:42", "remaining_time": "8:42:51"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:15:41", "remaining_time": "8:42:51"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:15:43", "remaining_time": "8:42:52"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:19:35", "remaining_time": "8:46:10"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:17:16", "remaining_time": "8:41:12"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:17:16", "remaining_time": "8:41:13"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:17:15", "remaining_time": "8:41:12"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:21:09", "remaining_time": "8:44:30"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:18:56", "remaining_time": "8:39:39"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:18:57", "remaining_time": "8:39:39"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:22:50", "remaining_time": "8:42:55"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:18:55", "remaining_time": "8:39:38"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7862, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:20:33", "remaining_time": "8:38:03"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7862, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:24:27", "remaining_time": "8:41:18"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7862, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:20:34", "remaining_time": "8:38:03"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7862, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:20:32", "remaining_time": "8:38:02"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:22:10", "remaining_time": "8:36:25"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:22:10", "remaining_time": "8:36:26"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:22:09", "remaining_time": "8:36:25"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:26:03", "remaining_time": "8:39:39"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:27:39", "remaining_time": "8:38:01"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:23:45", "remaining_time": "8:34:48"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:23:47", "remaining_time": "8:34:49"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:23:46", "remaining_time": "8:34:48"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7786, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:25:29", "remaining_time": "8:33:17"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7786, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:25:28", "remaining_time": "8:33:16"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7786, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:29:22", "remaining_time": "8:36:28"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7786, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:25:27", "remaining_time": "8:33:16"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8067, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "10:31:05", "remaining_time": "8:34:56"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8067, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "10:27:12", "remaining_time": "8:31:46"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8067, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "10:27:11", "remaining_time": "8:31:44"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8067, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "10:27:12", "remaining_time": "8:31:45"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "10:28:46", "remaining_time": "8:30:06"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "10:28:47", "remaining_time": "8:30:07"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "10:28:48", "remaining_time": "8:30:08"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "10:32:41", "remaining_time": "8:33:17"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7958, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "10:30:23", "remaining_time": "8:28:30"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7958, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "10:30:22", "remaining_time": "8:28:29"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7958, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "10:34:17", "remaining_time": "8:31:38"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7958, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "10:30:24", "remaining_time": "8:28:30"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "10:35:53", "remaining_time": "8:30:00"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "10:32:00", "remaining_time": "8:26:54"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "10:32:00", "remaining_time": "8:26:53"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "10:31:59", "remaining_time": "8:26:52"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "10:33:35", "remaining_time": "8:25:15"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "10:33:35", "remaining_time": "8:25:15"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "10:33:34", "remaining_time": "8:25:14"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "10:37:28", "remaining_time": "8:28:21"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "10:35:15", "remaining_time": "8:23:41"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "10:35:16", "remaining_time": "8:23:42"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "10:39:09", "remaining_time": "8:26:47"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "10:35:17", "remaining_time": "8:23:42"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7857, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "10:40:46", "remaining_time": "8:25:09"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7857, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "10:36:51", "remaining_time": "8:22:04"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7857, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "10:36:53", "remaining_time": "8:22:05"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7857, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "10:36:52", "remaining_time": "8:22:04"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "10:38:28", "remaining_time": "8:20:27"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "10:42:23", "remaining_time": "8:23:31"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "10:38:30", "remaining_time": "8:20:29"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "10:38:29", "remaining_time": "8:20:28"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.7768, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "10:40:04", "remaining_time": "8:18:50"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.7768, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "10:43:57", "remaining_time": "8:21:51"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.7768, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "10:40:02", "remaining_time": "8:18:49"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.7768, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "10:40:03", "remaining_time": "8:18:49"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "10:41:40", "remaining_time": "8:17:12"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "10:45:33", "remaining_time": "8:20:13"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "10:41:40", "remaining_time": "8:17:13"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "10:41:39", "remaining_time": "8:17:12"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "10:47:11", "remaining_time": "8:18:36"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "10:43:18", "remaining_time": "8:15:37"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "10:43:17", "remaining_time": "8:15:36"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "10:43:16", "remaining_time": "8:15:36"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.7994, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "10:44:53", "remaining_time": "8:13:59"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.7994, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "10:48:48", "remaining_time": "8:16:59"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.7994, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "10:44:55", "remaining_time": "8:14:00"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.7994, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "10:44:54", "remaining_time": "8:14:00"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "10:50:30", "remaining_time": "8:15:25"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "10:46:35", "remaining_time": "8:12:26"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "10:46:37", "remaining_time": "8:12:28"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "10:46:36", "remaining_time": "8:12:27"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "10:48:12", "remaining_time": "8:10:50"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "10:48:11", "remaining_time": "8:10:48"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "10:48:11", "remaining_time": "8:10:49"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "10:52:05", "remaining_time": "8:13:46"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "10:49:47", "remaining_time": "8:09:11"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "10:53:41", "remaining_time": "8:12:07"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "10:49:48", "remaining_time": "8:09:12"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "10:49:46", "remaining_time": "8:09:11"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "10:51:24", "remaining_time": "8:07:35"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "10:55:19", "remaining_time": "8:10:30"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "10:51:26", "remaining_time": "8:07:36"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "10:51:25", "remaining_time": "8:07:35"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.795, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "10:53:06", "remaining_time": "8:06:02"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.795, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "10:53:05", "remaining_time": "8:06:01"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.795, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "10:53:04", "remaining_time": "8:06:01"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.795, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "10:56:59", "remaining_time": "8:08:55"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "10:58:36", "remaining_time": "8:07:18"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "10:54:43", "remaining_time": "8:04:26"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "10:54:43", "remaining_time": "8:04:25"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "10:54:42", "remaining_time": "8:04:25"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "10:56:19", "remaining_time": "8:02:48"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "11:00:12", "remaining_time": "8:05:40"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "10:56:18", "remaining_time": "8:02:47"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "10:56:19", "remaining_time": "8:02:48"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7879, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "10:57:54", "remaining_time": "8:01:10"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7879, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "11:01:47", "remaining_time": "8:04:01"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7879, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "10:57:54", "remaining_time": "8:01:10"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7879, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "10:57:53", "remaining_time": "8:01:09"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "10:59:35", "remaining_time": "7:59:36"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "11:03:30", "remaining_time": "8:02:27"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "10:59:37", "remaining_time": "7:59:38"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "10:59:36", "remaining_time": "7:59:37"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:05:07", "remaining_time": "8:00:50"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:01:13", "remaining_time": "7:58:01"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:01:14", "remaining_time": "7:58:01"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:01:13", "remaining_time": "7:58:00"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:02:55", "remaining_time": "7:56:28"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:06:48", "remaining_time": "7:59:15"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:02:54", "remaining_time": "7:56:27"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:02:55", "remaining_time": "7:56:27"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:04:34", "remaining_time": "7:54:53"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:08:29", "remaining_time": "7:57:40"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:04:36", "remaining_time": "7:54:54"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:04:35", "remaining_time": "7:54:53"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.7966, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:06:11", "remaining_time": "7:53:16"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.7966, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:10:05", "remaining_time": "7:56:02"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.7966, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:06:10", "remaining_time": "7:53:15"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.7966, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:06:12", "remaining_time": "7:53:16"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:07:49", "remaining_time": "7:51:40"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:07:48", "remaining_time": "7:51:39"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:07:50", "remaining_time": "7:51:40"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.7976, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:11:43", "remaining_time": "7:54:25"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:13:21", "remaining_time": "7:52:48"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:09:28", "remaining_time": "7:50:05"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:09:26", "remaining_time": "7:50:03"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:09:27", "remaining_time": "7:50:04"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7848, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:11:06", "remaining_time": "7:48:29"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7848, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:15:01", "remaining_time": "7:51:13"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7848, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:11:08", "remaining_time": "7:48:30"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7848, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:11:07", "remaining_time": "7:48:30"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7675, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:12:42", "remaining_time": "7:46:51"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7675, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:12:43", "remaining_time": "7:46:52"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7675, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:12:43", "remaining_time": "7:46:52"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7675, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:16:36", "remaining_time": "7:49:34"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:14:20", "remaining_time": "7:45:15"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:18:14", "remaining_time": "7:47:57"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:14:21", "remaining_time": "7:45:16"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:14:19", "remaining_time": "7:45:15"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:19:52", "remaining_time": "7:46:20"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:15:59", "remaining_time": "7:43:40"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:15:58", "remaining_time": "7:43:40"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:15:58", "remaining_time": "7:43:39"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.776, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:17:36", "remaining_time": "7:42:04"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.776, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:17:38", "remaining_time": "7:42:05"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.776, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:21:31", "remaining_time": "7:44:44"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.776, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:17:37", "remaining_time": "7:42:04"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:19:12", "remaining_time": "7:40:26"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:19:13", "remaining_time": "7:40:27"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:19:14", "remaining_time": "7:40:27"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:23:07", "remaining_time": "7:43:05"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:20:54", "remaining_time": "7:38:53"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:20:55", "remaining_time": "7:38:54"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:20:56", "remaining_time": "7:38:54"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7934, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:24:49", "remaining_time": "7:41:31"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:22:30", "remaining_time": "7:37:16"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:22:31", "remaining_time": "7:37:16"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:22:32", "remaining_time": "7:37:17"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:26:25", "remaining_time": "7:39:53"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "11:24:08", "remaining_time": "7:35:39"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "11:24:09", "remaining_time": "7:35:40"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "11:28:02", "remaining_time": "7:38:15"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "11:24:08", "remaining_time": "7:35:40"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "11:29:43", "remaining_time": "7:36:40"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "11:25:49", "remaining_time": "7:34:05"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "11:25:48", "remaining_time": "7:34:05"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "11:25:50", "remaining_time": "7:34:06"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "11:31:15", "remaining_time": "7:34:59"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "11:27:21", "remaining_time": "7:32:26"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "11:27:22", "remaining_time": "7:32:26"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "11:27:21", "remaining_time": "7:32:25"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "11:29:02", "remaining_time": "7:30:51"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "11:32:55", "remaining_time": "7:33:24"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "11:29:02", "remaining_time": "7:30:51"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "11:29:01", "remaining_time": "7:30:50"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "11:30:39", "remaining_time": "7:29:15"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "11:30:40", "remaining_time": "7:29:15"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "11:30:41", "remaining_time": "7:29:16"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "11:34:34", "remaining_time": "7:31:47"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "11:32:16", "remaining_time": "7:27:38"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "11:36:09", "remaining_time": "7:30:08"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "11:32:15", "remaining_time": "7:27:37"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "11:32:14", "remaining_time": "7:27:37"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "11:33:53", "remaining_time": "7:26:01"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "11:33:53", "remaining_time": "7:26:01"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "11:37:47", "remaining_time": "7:28:32"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "11:33:54", "remaining_time": "7:26:02"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "11:39:23", "remaining_time": "7:26:53"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "11:35:29", "remaining_time": "7:24:24"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "11:35:30", "remaining_time": "7:24:24"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "11:35:30", "remaining_time": "7:24:25"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.7748, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "11:37:07", "remaining_time": "7:22:47"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.7748, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "11:41:00", "remaining_time": "7:25:16"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.7748, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "11:37:06", "remaining_time": "7:22:47"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.7748, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "11:37:07", "remaining_time": "7:22:48"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "11:38:43", "remaining_time": "7:21:11"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "11:38:44", "remaining_time": "7:21:11"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "11:38:45", "remaining_time": "7:21:12"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "11:42:38", "remaining_time": "7:23:39"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "11:40:24", "remaining_time": "7:19:36"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "11:44:18", "remaining_time": "7:22:03"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "11:40:26", "remaining_time": "7:19:37"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "11:40:25", "remaining_time": "7:19:37"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.7884, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "11:42:04", "remaining_time": "7:18:01"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.7884, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "11:42:02", "remaining_time": "7:18:00"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.7884, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "11:45:57", "remaining_time": "7:20:27"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.7884, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "11:42:03", "remaining_time": "7:18:01"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "11:43:41", "remaining_time": "7:16:25"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "11:43:40", "remaining_time": "7:16:24"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "11:47:35", "remaining_time": "7:18:50"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "11:43:42", "remaining_time": "7:16:25"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "11:45:17", "remaining_time": "7:14:47"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "11:49:12", "remaining_time": "7:17:12"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "11:45:19", "remaining_time": "7:14:48"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8039, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "11:45:18", "remaining_time": "7:14:48"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.7737, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "11:46:55", "remaining_time": "7:13:11"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.7737, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "11:50:49", "remaining_time": "7:15:35"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.7737, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "11:46:56", "remaining_time": "7:13:12"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.7737, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "11:46:56", "remaining_time": "7:13:12"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "11:48:32", "remaining_time": "7:11:34"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "11:48:33", "remaining_time": "7:11:35"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "11:48:34", "remaining_time": "7:11:35"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "11:52:27", "remaining_time": "7:13:57"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7865, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "11:50:14", "remaining_time": "7:10:01"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7865, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "11:50:15", "remaining_time": "7:10:01"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7865, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "11:54:09", "remaining_time": "7:12:23"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7865, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "11:50:16", "remaining_time": "7:10:02"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "11:51:56", "remaining_time": "7:08:27"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "11:51:57", "remaining_time": "7:08:28"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "11:55:50", "remaining_time": "7:10:48"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "11:51:56", "remaining_time": "7:08:27"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "11:53:36", "remaining_time": "7:06:52"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "11:57:30", "remaining_time": "7:09:12"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "11:53:37", "remaining_time": "7:06:53"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "11:53:37", "remaining_time": "7:06:52"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "11:55:14", "remaining_time": "7:05:15"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "11:55:13", "remaining_time": "7:05:15"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "11:55:14", "remaining_time": "7:05:16"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "11:59:07", "remaining_time": "7:07:34"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "11:56:46", "remaining_time": "7:03:36"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "12:00:41", "remaining_time": "7:05:55"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "11:56:48", "remaining_time": "7:03:37"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "11:56:47", "remaining_time": "7:03:36"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7694, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "11:58:27", "remaining_time": "7:02:02"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7694, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "12:02:21", "remaining_time": "7:04:19"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7694, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "11:58:28", "remaining_time": "7:02:02"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7694, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "11:58:26", "remaining_time": "7:02:01"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7874, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:00:05", "remaining_time": "7:00:25"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7874, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:00:04", "remaining_time": "7:00:25"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7874, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:03:58", "remaining_time": "7:02:41"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7874, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:00:03", "remaining_time": "7:00:24"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:01:40", "remaining_time": "6:58:47"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:05:35", "remaining_time": "7:01:04"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:01:42", "remaining_time": "6:58:48"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:01:41", "remaining_time": "6:58:48"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:03:21", "remaining_time": "6:57:13"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:07:15", "remaining_time": "6:59:28"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:03:22", "remaining_time": "6:57:14"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:03:21", "remaining_time": "6:57:13"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:04:57", "remaining_time": "6:55:35"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:04:56", "remaining_time": "6:55:35"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:04:58", "remaining_time": "6:55:36"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8003, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:08:51", "remaining_time": "6:57:49"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:10:26", "remaining_time": "6:56:11"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:06:32", "remaining_time": "6:53:57"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:06:33", "remaining_time": "6:53:58"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:06:33", "remaining_time": "6:53:58"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:08:14", "remaining_time": "6:52:24"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:12:09", "remaining_time": "6:54:36"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:08:16", "remaining_time": "6:52:24"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:08:15", "remaining_time": "6:52:24"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:09:55", "remaining_time": "6:50:49"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:09:55", "remaining_time": "6:50:49"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:13:48", "remaining_time": "6:53:00"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:09:54", "remaining_time": "6:50:48"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:11:34", "remaining_time": "6:49:13"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:11:33", "remaining_time": "6:49:13"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:15:27", "remaining_time": "6:51:24"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:11:32", "remaining_time": "6:49:12"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:17:02", "remaining_time": "6:49:45"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:13:08", "remaining_time": "6:47:35"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:13:09", "remaining_time": "6:47:35"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:13:07", "remaining_time": "6:47:34"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:14:43", "remaining_time": "6:45:57"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:18:37", "remaining_time": "6:48:06"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:14:44", "remaining_time": "6:45:58"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:14:44", "remaining_time": "6:45:57"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7836, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:20:16", "remaining_time": "6:46:29"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7836, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:16:22", "remaining_time": "6:44:21"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7836, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:16:23", "remaining_time": "6:44:22"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7836, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:16:21", "remaining_time": "6:44:21"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:17:56", "remaining_time": "6:42:43"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:17:57", "remaining_time": "6:42:43"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:17:58", "remaining_time": "6:42:43"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:21:50", "remaining_time": "6:44:51"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7937, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:19:33", "remaining_time": "6:41:06"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7937, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:19:34", "remaining_time": "6:41:06"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7937, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:23:27", "remaining_time": "6:43:13"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7937, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:19:34", "remaining_time": "6:41:07"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "12:21:10", "remaining_time": "6:39:29"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "12:21:09", "remaining_time": "6:39:28"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "12:25:02", "remaining_time": "6:41:34"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "12:21:08", "remaining_time": "6:39:28"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "12:22:46", "remaining_time": "6:37:51"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "12:26:39", "remaining_time": "6:39:57"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "12:22:45", "remaining_time": "6:37:51"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "12:22:47", "remaining_time": "6:37:52"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "12:24:19", "remaining_time": "6:36:13"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "12:24:20", "remaining_time": "6:36:13"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "12:24:21", "remaining_time": "6:36:14"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "12:28:14", "remaining_time": "6:38:18"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "12:25:56", "remaining_time": "6:34:36"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "12:25:57", "remaining_time": "6:34:36"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "12:29:50", "remaining_time": "6:36:40"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "12:25:55", "remaining_time": "6:34:35"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "12:27:29", "remaining_time": "6:32:57"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "12:27:31", "remaining_time": "6:32:58"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "12:31:24", "remaining_time": "6:35:00"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "12:27:30", "remaining_time": "6:32:57"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "12:29:12", "remaining_time": "6:31:23"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "12:33:06", "remaining_time": "6:33:25"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "12:29:13", "remaining_time": "6:31:24"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "12:29:11", "remaining_time": "6:31:23"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "12:30:49", "remaining_time": "6:29:47"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "12:34:42", "remaining_time": "6:31:48"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "12:30:48", "remaining_time": "6:29:46"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "12:30:48", "remaining_time": "6:29:46"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "12:32:22", "remaining_time": "6:28:07"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "12:32:23", "remaining_time": "6:28:08"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "12:36:16", "remaining_time": "6:30:08"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7925, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "12:32:23", "remaining_time": "6:28:08"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "12:33:59", "remaining_time": "6:26:31"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "12:37:54", "remaining_time": "6:28:31"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "12:34:01", "remaining_time": "6:26:32"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "12:34:00", "remaining_time": "6:26:31"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "12:35:38", "remaining_time": "6:24:55"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "12:39:32", "remaining_time": "6:26:54"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "12:35:39", "remaining_time": "6:24:55"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "12:35:39", "remaining_time": "6:24:56"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.2696292959503922e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "12:37:15", "remaining_time": "6:23:18"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.2696292959503922e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "12:37:16", "remaining_time": "6:23:19"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.2696292959503922e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "12:41:10", "remaining_time": "6:25:17"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.2696292959503922e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "12:37:17", "remaining_time": "6:23:19"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7898, "reward": null, "learning_rate": 1.2599628708177253e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "12:38:51", "remaining_time": "6:21:41"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7898, "reward": null, "learning_rate": 1.2599628708177253e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "12:42:46", "remaining_time": "6:23:39"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7898, "reward": null, "learning_rate": 1.2599628708177253e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "12:38:53", "remaining_time": "6:21:42"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7898, "reward": null, "learning_rate": 1.2599628708177253e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "12:38:52", "remaining_time": "6:21:41"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.250320972002072e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "12:40:30", "remaining_time": "6:20:05"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.250320972002072e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "12:44:24", "remaining_time": "6:22:02"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.250320972002072e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "12:40:31", "remaining_time": "6:20:06"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.250320972002072e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "12:40:29", "remaining_time": "6:20:05"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.2407037902076168e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "12:42:10", "remaining_time": "6:18:30"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.2407037902076168e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "12:46:04", "remaining_time": "6:20:26"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.2407037902076168e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "12:42:11", "remaining_time": "6:18:30"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7735, "reward": null, "learning_rate": 1.2407037902076168e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "12:42:11", "remaining_time": "6:18:30"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.23111151564967e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "12:43:45", "remaining_time": "6:16:52"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.23111151564967e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "12:43:46", "remaining_time": "6:16:52"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.23111151564967e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "12:47:40", "remaining_time": "6:18:48"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 1.23111151564967e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "12:43:47", "remaining_time": "6:16:53"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 1.2215443380509125e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "12:45:21", "remaining_time": "6:15:14"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 1.2215443380509125e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "12:45:21", "remaining_time": "6:15:15"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 1.2215443380509125e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "12:45:22", "remaining_time": "6:15:15"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 1.2215443380509125e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "12:49:15", "remaining_time": "6:17:09"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 1.2120024466376381e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "12:50:57", "remaining_time": "6:15:34"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 1.2120024466376381e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "12:47:03", "remaining_time": "6:13:40"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 1.2120024466376381e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "12:47:04", "remaining_time": "6:13:41"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 1.2120024466376381e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "12:47:02", "remaining_time": "6:13:40"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.2024860301360131e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "12:52:32", "remaining_time": "6:13:56"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.2024860301360131e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "12:48:37", "remaining_time": "6:12:02"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.2024860301360131e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "12:48:39", "remaining_time": "6:12:03"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.2024860301360131e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "12:48:38", "remaining_time": "6:12:02"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1929952767683426e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "12:50:17", "remaining_time": "6:10:26"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1929952767683426e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "12:54:10", "remaining_time": "6:12:19"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1929952767683426e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "12:50:16", "remaining_time": "6:10:26"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1929952767683426e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "12:50:17", "remaining_time": "6:10:27"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 1.1835303742493508e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "12:55:46", "remaining_time": "6:10:40"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 1.1835303742493508e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "12:51:53", "remaining_time": "6:08:49"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 1.1835303742493508e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "12:51:52", "remaining_time": "6:08:49"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 1.1835303742493508e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "12:51:51", "remaining_time": "6:08:48"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.1740915097824629e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "12:53:28", "remaining_time": "6:07:11"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.1740915097824629e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "12:53:30", "remaining_time": "6:07:12"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.1740915097824629e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "12:57:23", "remaining_time": "6:09:03"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.1740915097824629e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "12:53:29", "remaining_time": "6:07:12"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.768, "reward": null, "learning_rate": 1.1646788700561085e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "12:59:01", "remaining_time": "6:07:26"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.768, "reward": null, "learning_rate": 1.1646788700561085e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "12:55:06", "remaining_time": "6:05:35"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.768, "reward": null, "learning_rate": 1.1646788700561085e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "12:55:08", "remaining_time": "6:05:36"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.768, "reward": null, "learning_rate": 1.1646788700561085e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "12:55:07", "remaining_time": "6:05:36"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7935, "reward": null, "learning_rate": 1.1552926412400225e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "12:56:43", "remaining_time": "6:03:58"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7935, "reward": null, "learning_rate": 1.1552926412400225e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "13:00:37", "remaining_time": "6:05:48"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7935, "reward": null, "learning_rate": 1.1552926412400225e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "12:56:42", "remaining_time": "6:03:58"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7935, "reward": null, "learning_rate": 1.1552926412400225e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "12:56:44", "remaining_time": "6:03:59"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.1459330089815699e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "12:58:21", "remaining_time": "6:02:22"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.1459330089815699e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "12:58:22", "remaining_time": "6:02:22"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.1459330089815699e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "13:02:16", "remaining_time": "6:04:11"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.1459330089815699e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "12:58:23", "remaining_time": "6:02:23"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.136600158402068e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:03:55", "remaining_time": "6:02:35"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.136600158402068e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:00:01", "remaining_time": "6:00:46"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.136600158402068e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:00:02", "remaining_time": "6:00:47"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 1.136600158402068e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:00:02", "remaining_time": "6:00:47"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.1272942740931286e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:01:43", "remaining_time": "5:59:12"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.1272942740931286e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:05:37", "remaining_time": "6:00:59"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.1272942740931286e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:01:44", "remaining_time": "5:59:12"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.1272942740931286e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:01:42", "remaining_time": "5:59:12"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.1180155401130044e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:03:23", "remaining_time": "5:57:36"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.1180155401130044e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:07:17", "remaining_time": "5:59:23"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.1180155401130044e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:03:24", "remaining_time": "5:57:37"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 1.1180155401130044e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:03:22", "remaining_time": "5:57:36"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 1.1087641399829527e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:08:54", "remaining_time": "5:57:46"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 1.1087641399829527e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:05:01", "remaining_time": "5:56:00"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 1.1087641399829527e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:05:00", "remaining_time": "5:56:00"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 1.1087641399829527e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:04:59", "remaining_time": "5:55:59"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 1.0995402566835997e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:06:34", "remaining_time": "5:54:21"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 1.0995402566835997e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:06:33", "remaining_time": "5:54:21"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 1.0995402566835997e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:10:28", "remaining_time": "5:56:07"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 1.0995402566835997e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:06:35", "remaining_time": "5:54:22"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.7998, "reward": null, "learning_rate": 1.090344072651328e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:12:06", "remaining_time": "5:54:30"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.7998, "reward": null, "learning_rate": 1.090344072651328e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:08:13", "remaining_time": "5:52:45"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.7998, "reward": null, "learning_rate": 1.090344072651328e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:08:14", "remaining_time": "5:52:46"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.7998, "reward": null, "learning_rate": 1.090344072651328e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:08:12", "remaining_time": "5:52:45"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.0811757697746614e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:13:44", "remaining_time": "5:52:52"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.0811757697746614e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:09:51", "remaining_time": "5:51:09"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.0811757697746614e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:09:50", "remaining_time": "5:51:09"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.0811757697746614e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:09:49", "remaining_time": "5:51:08"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.0720355293906741e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:15:20", "remaining_time": "5:51:14"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.0720355293906741e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:11:25", "remaining_time": "5:49:31"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.0720355293906741e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:11:27", "remaining_time": "5:49:32"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.0720355293906741e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:11:26", "remaining_time": "5:49:31"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 1.0629235322813982e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:13:03", "remaining_time": "5:47:54"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 1.0629235322813982e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:16:57", "remaining_time": "5:49:37"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 1.0629235322813982e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:13:04", "remaining_time": "5:47:55"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 1.0629235322813982e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:13:03", "remaining_time": "5:47:54"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7941, "reward": null, "learning_rate": 1.0538399586702507e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:18:35", "remaining_time": "5:48:00"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7941, "reward": null, "learning_rate": 1.0538399586702507e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:14:42", "remaining_time": "5:46:18"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7941, "reward": null, "learning_rate": 1.0538399586702507e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:14:43", "remaining_time": "5:46:18"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7941, "reward": null, "learning_rate": 1.0538399586702507e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:14:41", "remaining_time": "5:46:18"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 1.0447849882184715e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:20:15", "remaining_time": "5:46:23"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 1.0447849882184715e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:16:22", "remaining_time": "5:44:43"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 1.0447849882184715e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:16:21", "remaining_time": "5:44:42"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 1.0447849882184715e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:16:20", "remaining_time": "5:44:42"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.035758800021564e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "13:17:57", "remaining_time": "5:43:05"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.035758800021564e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "13:21:51", "remaining_time": "5:44:45"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.035758800021564e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "13:17:58", "remaining_time": "5:43:05"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.035758800021564e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "13:17:56", "remaining_time": "5:43:05"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7825, "reward": null, "learning_rate": 1.0267615726057592e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "13:19:34", "remaining_time": "5:41:28"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7825, "reward": null, "learning_rate": 1.0267615726057592e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "13:23:29", "remaining_time": "5:43:08"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7825, "reward": null, "learning_rate": 1.0267615726057592e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "13:19:36", "remaining_time": "5:41:29"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7825, "reward": null, "learning_rate": 1.0267615726057592e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "13:19:35", "remaining_time": "5:41:29"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.0177934839244787e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "13:21:11", "remaining_time": "5:39:51"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.0177934839244787e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "13:21:12", "remaining_time": "5:39:52"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.0177934839244787e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "13:21:13", "remaining_time": "5:39:52"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.0177934839244787e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "13:25:06", "remaining_time": "5:41:31"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.0088547113548211e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "13:22:50", "remaining_time": "5:38:15"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.0088547113548211e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "13:26:43", "remaining_time": "5:39:53"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.0088547113548211e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "13:22:51", "remaining_time": "5:38:15"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.0088547113548211e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "13:22:49", "remaining_time": "5:38:15"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 9.99945431694048e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "13:28:24", "remaining_time": "5:38:18"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 9.99945431694048e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "13:24:32", "remaining_time": "5:36:40"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 9.99945431694048e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "13:24:31", "remaining_time": "5:36:40"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 9.99945431694048e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "13:24:30", "remaining_time": "5:36:39"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 9.910658211560902e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "13:26:08", "remaining_time": "5:35:03"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 9.910658211560902e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "13:26:08", "remaining_time": "5:35:03"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 9.910658211560902e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "13:30:01", "remaining_time": "5:36:40"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 9.910658211560902e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "13:26:07", "remaining_time": "5:35:02"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7809, "reward": null, "learning_rate": 9.822160553680617e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "13:27:50", "remaining_time": "5:33:28"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7809, "reward": null, "learning_rate": 9.822160553680617e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "13:27:50", "remaining_time": "5:33:28"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7809, "reward": null, "learning_rate": 9.822160553680617e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "13:31:44", "remaining_time": "5:35:05"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7809, "reward": null, "learning_rate": 9.822160553680617e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "13:27:51", "remaining_time": "5:33:29"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 9.733963093667889e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "13:33:22", "remaining_time": "5:33:28"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 9.733963093667889e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "13:29:29", "remaining_time": "5:31:52"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 9.733963093667889e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "13:29:28", "remaining_time": "5:31:52"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 9.733963093667889e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "13:29:29", "remaining_time": "5:31:52"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 9.646067575953419e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "13:31:05", "remaining_time": "5:30:15"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 9.646067575953419e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "13:34:59", "remaining_time": "5:31:50"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 9.646067575953419e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "13:31:06", "remaining_time": "5:30:15"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 9.646067575953419e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "13:31:06", "remaining_time": "5:30:15"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.775, "reward": null, "learning_rate": 9.558475738995923e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "13:32:45", "remaining_time": "5:28:39"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.775, "reward": null, "learning_rate": 9.558475738995923e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "13:32:46", "remaining_time": "5:28:39"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.775, "reward": null, "learning_rate": 9.558475738995923e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "13:36:39", "remaining_time": "5:30:14"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.775, "reward": null, "learning_rate": 9.558475738995923e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "13:32:44", "remaining_time": "5:28:39"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 9.471189315247669e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "13:34:23", "remaining_time": "5:27:02"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 9.471189315247669e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "13:34:24", "remaining_time": "5:27:03"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 9.471189315247669e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "13:34:24", "remaining_time": "5:27:03"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 9.471189315247669e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "13:38:17", "remaining_time": "5:28:37"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7795, "reward": null, "learning_rate": 9.384210031120288e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "13:36:02", "remaining_time": "5:25:26"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7795, "reward": null, "learning_rate": 9.384210031120288e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "13:39:57", "remaining_time": "5:27:00"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7795, "reward": null, "learning_rate": 9.384210031120288e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "13:36:03", "remaining_time": "5:25:27"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7795, "reward": null, "learning_rate": 9.384210031120288e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "13:36:04", "remaining_time": "5:25:27"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 9.297539606950564e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "13:37:40", "remaining_time": "5:23:50"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 9.297539606950564e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "13:41:35", "remaining_time": "5:25:23"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 9.297539606950564e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "13:37:42", "remaining_time": "5:23:51"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 9.297539606950564e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "13:37:41", "remaining_time": "5:23:50"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 9.21117975696644e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "13:43:13", "remaining_time": "5:23:46"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 9.21117975696644e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "13:39:20", "remaining_time": "5:22:14"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 9.21117975696644e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "13:39:19", "remaining_time": "5:22:14"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7859, "reward": null, "learning_rate": 9.21117975696644e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "13:39:18", "remaining_time": "5:22:13"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 9.1251321892531e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "13:40:55", "remaining_time": "5:20:36"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 9.1251321892531e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "13:40:56", "remaining_time": "5:20:37"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 9.1251321892531e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "13:44:50", "remaining_time": "5:22:08"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 9.1251321892531e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "13:40:57", "remaining_time": "5:20:37"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 9.039398605719215e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "13:42:34", "remaining_time": "5:19:00"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 9.039398605719215e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "13:42:35", "remaining_time": "5:19:01"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 9.039398605719215e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "13:42:36", "remaining_time": "5:19:01"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 9.039398605719215e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "13:46:29", "remaining_time": "5:20:31"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 8.953980702063233e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "13:48:04", "remaining_time": "5:18:53"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 8.953980702063233e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "13:44:10", "remaining_time": "5:17:23"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 8.953980702063233e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "13:44:11", "remaining_time": "5:17:23"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 8.953980702063233e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "13:44:09", "remaining_time": "5:17:23"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 8.868880167739887e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "13:45:49", "remaining_time": "5:15:47"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 8.868880167739887e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "13:45:48", "remaining_time": "5:15:46"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 8.868880167739887e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "13:45:50", "remaining_time": "5:15:47"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 8.868880167739887e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "13:49:43", "remaining_time": "5:17:16"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 8.784098685926734e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "13:47:24", "remaining_time": "5:14:09"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 8.784098685926734e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "13:47:26", "remaining_time": "5:14:10"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 8.784098685926734e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "13:47:25", "remaining_time": "5:14:09"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 8.784098685926734e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "13:51:19", "remaining_time": "5:15:38"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 8.699637933490917e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "13:49:03", "remaining_time": "5:12:33"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 8.699637933490917e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "13:52:58", "remaining_time": "5:14:01"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 8.699637933490917e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "13:49:04", "remaining_time": "5:12:33"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 8.699637933490917e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "13:49:05", "remaining_time": "5:12:33"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 8.615499580955953e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "13:54:31", "remaining_time": "5:12:22"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 8.615499580955953e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "13:50:36", "remaining_time": "5:10:54"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 8.615499580955953e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "13:50:38", "remaining_time": "5:10:55"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 8.615499580955953e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "13:50:37", "remaining_time": "5:10:55"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.531685292468693e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "13:52:17", "remaining_time": "5:09:19"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.531685292468693e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "13:52:18", "remaining_time": "5:09:19"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.531685292468693e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "13:52:18", "remaining_time": "5:09:19"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.531685292468693e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "13:56:11", "remaining_time": "5:10:46"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 8.448196725766471e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "13:53:57", "remaining_time": "5:07:43"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 8.448196725766471e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "13:57:50", "remaining_time": "5:09:09"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 8.448196725766471e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "13:53:57", "remaining_time": "5:07:43"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 8.448196725766471e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "13:53:56", "remaining_time": "5:07:42"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 8.365035532144217e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "13:59:26", "remaining_time": "5:07:31"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 8.365035532144217e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "13:55:31", "remaining_time": "5:06:05"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 8.365035532144217e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "13:55:32", "remaining_time": "5:06:05"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 8.365035532144217e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "13:55:33", "remaining_time": "5:06:06"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 8.282203356421891e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "13:57:12", "remaining_time": "5:04:29"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 8.282203356421891e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "14:01:07", "remaining_time": "5:05:55"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 8.282203356421891e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "13:57:14", "remaining_time": "5:04:30"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 8.282203356421891e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "13:57:13", "remaining_time": "5:04:30"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.7972, "reward": null, "learning_rate": 8.199701836911877e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "13:58:48", "remaining_time": "5:02:52"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.7972, "reward": null, "learning_rate": 8.199701836911877e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "13:58:47", "remaining_time": "5:02:52"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.7972, "reward": null, "learning_rate": 8.199701836911877e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "13:58:49", "remaining_time": "5:02:52"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.7972, "reward": null, "learning_rate": 8.199701836911877e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "14:02:42", "remaining_time": "5:04:17"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 8.117532605386632e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:00:26", "remaining_time": "5:01:15"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 8.117532605386632e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:04:20", "remaining_time": "5:02:40"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 8.117532605386632e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:00:27", "remaining_time": "5:01:16"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 8.117532605386632e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:00:28", "remaining_time": "5:01:16"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 8.035697287046376e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:02:02", "remaining_time": "4:59:38"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 8.035697287046376e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:05:57", "remaining_time": "5:01:02"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 8.035697287046376e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:02:04", "remaining_time": "4:59:39"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 8.035697287046376e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:02:03", "remaining_time": "4:59:38"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.954197500486968e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:03:39", "remaining_time": "4:58:01"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.954197500486968e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:03:38", "remaining_time": "4:58:01"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.954197500486968e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:03:40", "remaining_time": "4:58:02"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.954197500486968e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:07:33", "remaining_time": "4:59:24"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.873034857667877e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:05:13", "remaining_time": "4:56:23"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.873034857667877e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:05:14", "remaining_time": "4:56:24"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.873034857667877e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:05:15", "remaining_time": "4:56:24"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 7.873034857667877e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:09:08", "remaining_time": "4:57:45"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.792210963880328e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:10:44", "remaining_time": "4:56:08"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.792210963880328e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:06:51", "remaining_time": "4:54:46"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.792210963880328e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:06:50", "remaining_time": "4:54:46"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.792210963880328e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:06:49", "remaining_time": "4:54:46"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 7.711727417715509e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:12:23", "remaining_time": "4:54:31"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 7.711727417715509e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:08:28", "remaining_time": "4:53:10"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 7.711727417715509e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:08:29", "remaining_time": "4:53:10"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 7.711727417715509e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:08:30", "remaining_time": "4:53:10"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 7.631585811032999e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:10:09", "remaining_time": "4:51:34"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 7.631585811032999e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:10:08", "remaining_time": "4:51:34"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 7.631585811032999e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:14:03", "remaining_time": "4:52:54"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 7.631585811032999e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:10:10", "remaining_time": "4:51:34"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 7.551787728929236e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:15:38", "remaining_time": "4:51:16"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 7.551787728929236e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:11:43", "remaining_time": "4:49:56"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 7.551787728929236e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:11:44", "remaining_time": "4:49:56"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 7.551787728929236e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:11:45", "remaining_time": "4:49:57"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 7.472334749706214e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:13:21", "remaining_time": "4:48:20"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 7.472334749706214e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:17:16", "remaining_time": "4:49:39"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 7.472334749706214e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:13:22", "remaining_time": "4:48:20"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 7.472334749706214e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:13:23", "remaining_time": "4:48:20"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7601, "reward": null, "learning_rate": 7.393228444840228e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "14:15:00", "remaining_time": "4:46:43"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7601, "reward": null, "learning_rate": 7.393228444840228e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "14:15:01", "remaining_time": "4:46:43"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7601, "reward": null, "learning_rate": 7.393228444840228e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "14:18:54", "remaining_time": "4:48:02"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7601, "reward": null, "learning_rate": 7.393228444840228e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "14:14:59", "remaining_time": "4:46:43"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 7.314470378950802e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "14:16:35", "remaining_time": "4:45:05"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 7.314470378950802e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "14:16:36", "remaining_time": "4:45:06"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 7.314470378950802e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "14:16:37", "remaining_time": "4:45:06"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 7.314470378950802e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "14:20:29", "remaining_time": "4:46:24"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 7.23606210976975e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "14:18:15", "remaining_time": "4:43:30"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 7.23606210976975e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "14:18:14", "remaining_time": "4:43:29"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 7.23606210976975e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "14:22:09", "remaining_time": "4:44:47"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 7.23606210976975e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "14:18:16", "remaining_time": "4:43:30"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 7.158005188110381e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "14:19:51", "remaining_time": "4:41:52"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 7.158005188110381e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "14:23:44", "remaining_time": "4:43:09"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 7.158005188110381e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "14:19:49", "remaining_time": "4:41:52"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 7.158005188110381e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "14:19:50", "remaining_time": "4:41:52"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 7.080301157836783e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "14:21:25", "remaining_time": "4:40:14"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 7.080301157836783e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "14:25:19", "remaining_time": "4:41:30"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 7.080301157836783e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "14:21:24", "remaining_time": "4:40:14"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 7.080301157836783e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "14:21:26", "remaining_time": "4:40:15"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 7.002951555833334e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "14:23:03", "remaining_time": "4:38:38"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 7.002951555833334e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "14:26:57", "remaining_time": "4:39:53"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 7.002951555833334e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "14:23:04", "remaining_time": "4:38:38"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7692, "reward": null, "learning_rate": 7.002951555833334e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "14:23:04", "remaining_time": "4:38:38"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7656, "reward": null, "learning_rate": 6.925957911974262e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "14:24:40", "remaining_time": "4:37:01"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7656, "reward": null, "learning_rate": 6.925957911974262e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "14:28:33", "remaining_time": "4:38:15"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7656, "reward": null, "learning_rate": 6.925957911974262e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "14:24:41", "remaining_time": "4:37:01"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7656, "reward": null, "learning_rate": 6.925957911974262e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "14:24:39", "remaining_time": "4:37:00"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 6.849321749093432e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "14:26:12", "remaining_time": "4:35:22"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 6.849321749093432e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "14:26:14", "remaining_time": "4:35:23"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 6.849321749093432e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "14:30:07", "remaining_time": "4:36:37"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7754, "reward": null, "learning_rate": 6.849321749093432e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "14:26:13", "remaining_time": "4:35:22"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.773044582954172e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "14:27:51", "remaining_time": "4:33:46"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.773044582954172e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "14:27:52", "remaining_time": "4:33:46"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.773044582954172e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "14:31:45", "remaining_time": "4:35:00"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.773044582954172e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "14:27:52", "remaining_time": "4:33:46"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 6.697127922219357e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "14:29:25", "remaining_time": "4:32:08"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 6.697127922219357e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "14:29:24", "remaining_time": "4:32:07"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 6.697127922219357e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "14:29:25", "remaining_time": "4:32:08"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 6.697127922219357e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "14:33:18", "remaining_time": "4:33:21"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.621573268421505e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "14:31:03", "remaining_time": "4:30:31"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.621573268421505e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "14:34:58", "remaining_time": "4:31:44"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.621573268421505e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "14:31:05", "remaining_time": "4:30:32"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.621573268421505e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "14:31:04", "remaining_time": "4:30:31"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 6.546382115933117e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "14:32:37", "remaining_time": "4:28:53"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 6.546382115933117e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "14:32:38", "remaining_time": "4:28:54"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 6.546382115933117e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "14:36:32", "remaining_time": "4:30:06"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7908, "reward": null, "learning_rate": 6.546382115933117e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "14:32:39", "remaining_time": "4:28:54"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 6.47155595193713e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "14:34:17", "remaining_time": "4:27:17"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 6.47155595193713e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "14:38:12", "remaining_time": "4:28:29"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 6.47155595193713e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "14:34:18", "remaining_time": "4:27:18"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 6.47155595193713e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "14:34:19", "remaining_time": "4:27:18"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 6.397096256397456e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "14:35:57", "remaining_time": "4:25:41"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 6.397096256397456e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "14:39:51", "remaining_time": "4:26:52"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 6.397096256397456e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "14:35:58", "remaining_time": "4:25:41"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 6.397096256397456e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "14:35:56", "remaining_time": "4:25:41"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 6.323004502029767e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "14:41:28", "remaining_time": "4:25:15"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 6.323004502029767e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "14:37:33", "remaining_time": "4:24:04"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 6.323004502029767e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "14:37:34", "remaining_time": "4:24:04"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 6.323004502029767e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "14:37:35", "remaining_time": "4:24:05"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 6.249282154272315e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "14:39:14", "remaining_time": "4:22:28"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 6.249282154272315e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "14:43:06", "remaining_time": "4:23:38"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 6.249282154272315e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "14:39:12", "remaining_time": "4:22:28"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 6.249282154272315e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "14:39:13", "remaining_time": "4:22:28"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 6.175930671256991e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "14:40:47", "remaining_time": "4:20:50"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 6.175930671256991e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "14:40:48", "remaining_time": "4:20:50"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 6.175930671256991e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "14:40:49", "remaining_time": "4:20:51"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 6.175930671256991e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "14:44:42", "remaining_time": "4:22:00"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7915, "reward": null, "learning_rate": 6.102951503780449e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "14:42:26", "remaining_time": "4:19:14"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7915, "reward": null, "learning_rate": 6.102951503780449e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "14:42:25", "remaining_time": "4:19:13"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7915, "reward": null, "learning_rate": 6.102951503780449e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "14:46:19", "remaining_time": "4:20:22"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7915, "reward": null, "learning_rate": 6.102951503780449e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "14:42:27", "remaining_time": "4:19:14"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 6.030346095275438e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "14:44:02", "remaining_time": "4:17:37"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 6.030346095275438e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "14:44:04", "remaining_time": "4:17:37"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 6.030346095275438e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "14:47:57", "remaining_time": "4:18:45"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 6.030346095275438e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "14:44:03", "remaining_time": "4:17:37"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7813, "reward": null, "learning_rate": 5.958115881782228e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "14:49:34", "remaining_time": "4:17:07"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7813, "reward": null, "learning_rate": 5.958115881782228e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "14:45:41", "remaining_time": "4:16:00"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7813, "reward": null, "learning_rate": 5.958115881782228e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "14:45:40", "remaining_time": "4:16:00"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7813, "reward": null, "learning_rate": 5.958115881782228e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "14:45:39", "remaining_time": "4:16:00"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.793, "reward": null, "learning_rate": 5.886262291920244e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "14:51:09", "remaining_time": "4:15:29"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.793, "reward": null, "learning_rate": 5.886262291920244e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "14:47:14", "remaining_time": "4:14:22"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.793, "reward": null, "learning_rate": 5.886262291920244e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "14:47:15", "remaining_time": "4:14:22"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.793, "reward": null, "learning_rate": 5.886262291920244e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "14:47:16", "remaining_time": "4:14:23"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.81478674685976e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "14:48:50", "remaining_time": "4:12:45"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.81478674685976e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "14:48:51", "remaining_time": "4:12:45"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.81478674685976e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "14:52:45", "remaining_time": "4:13:52"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.81478674685976e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "14:48:52", "remaining_time": "4:12:45"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.7436906602938435e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "14:50:28", "remaining_time": "4:11:08"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.7436906602938435e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "14:54:23", "remaining_time": "4:12:14"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.7436906602938435e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "14:50:30", "remaining_time": "4:11:09"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.7436906602938435e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "14:50:29", "remaining_time": "4:11:08"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7762, "reward": null, "learning_rate": 5.672975438410344e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "14:52:08", "remaining_time": "4:09:32"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7762, "reward": null, "learning_rate": 5.672975438410344e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "14:52:10", "remaining_time": "4:09:32"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7762, "reward": null, "learning_rate": 5.672975438410344e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "14:56:03", "remaining_time": "4:10:38"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7762, "reward": null, "learning_rate": 5.672975438410344e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "14:52:09", "remaining_time": "4:09:32"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7775, "reward": null, "learning_rate": 5.602642479864129e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "14:53:43", "remaining_time": "4:07:55"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7775, "reward": null, "learning_rate": 5.602642479864129e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "14:57:38", "remaining_time": "4:09:00"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7775, "reward": null, "learning_rate": 5.602642479864129e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "14:53:45", "remaining_time": "4:07:55"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7775, "reward": null, "learning_rate": 5.602642479864129e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "14:53:44", "remaining_time": "4:07:55"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 5.532693175749373e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "14:55:16", "remaining_time": "4:06:16"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 5.532693175749373e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "14:59:11", "remaining_time": "4:07:21"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 5.532693175749373e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "14:55:18", "remaining_time": "4:06:17"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 5.532693175749373e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "14:55:17", "remaining_time": "4:06:17"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 5.463128909572077e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "14:56:55", "remaining_time": "4:04:40"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 5.463128909572077e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "14:56:56", "remaining_time": "4:04:40"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 5.463128909572077e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "14:56:56", "remaining_time": "4:04:40"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 5.463128909572077e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "15:00:49", "remaining_time": "4:05:44"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.393951057222685e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "14:58:31", "remaining_time": "4:03:03"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.393951057222685e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "15:02:25", "remaining_time": "4:04:06"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.393951057222685e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "14:58:33", "remaining_time": "4:03:03"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 5.393951057222685e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "14:58:32", "remaining_time": "4:03:03"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 5.325160986948899e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:00:07", "remaining_time": "4:01:26"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 5.325160986948899e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:00:09", "remaining_time": "4:01:26"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 5.325160986948899e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:04:02", "remaining_time": "4:02:29"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 5.325160986948899e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:00:08", "remaining_time": "4:01:26"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7698, "reward": null, "learning_rate": 5.256760059328572e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:01:47", "remaining_time": "3:59:49"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7698, "reward": null, "learning_rate": 5.256760059328572e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:05:40", "remaining_time": "4:00:51"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7698, "reward": null, "learning_rate": 5.256760059328572e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:01:46", "remaining_time": "3:59:49"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7698, "reward": null, "learning_rate": 5.256760059328572e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:01:47", "remaining_time": "3:59:50"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 5.188749627242851e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:03:25", "remaining_time": "3:58:13"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 5.188749627242851e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:03:27", "remaining_time": "3:58:13"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 5.188749627242851e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:03:26", "remaining_time": "3:58:13"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 5.188749627242851e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:07:20", "remaining_time": "3:59:15"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 5.121131035849361e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:05:01", "remaining_time": "3:56:35"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 5.121131035849361e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:08:55", "remaining_time": "3:57:37"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 5.121131035849361e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:05:02", "remaining_time": "3:56:36"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 5.121131035849361e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:05:00", "remaining_time": "3:56:35"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7869, "reward": null, "learning_rate": 5.053905622555657e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:06:35", "remaining_time": "3:54:58"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7869, "reward": null, "learning_rate": 5.053905622555657e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:06:35", "remaining_time": "3:54:58"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7869, "reward": null, "learning_rate": 5.053905622555657e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:06:36", "remaining_time": "3:54:58"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7869, "reward": null, "learning_rate": 5.053905622555657e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:10:29", "remaining_time": "3:55:58"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 4.987074716992724e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:08:14", "remaining_time": "3:53:21"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 4.987074716992724e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:12:09", "remaining_time": "3:54:22"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 4.987074716992724e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:08:16", "remaining_time": "3:53:22"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 4.987074716992724e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:08:15", "remaining_time": "3:53:22"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 4.920639640988697e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:09:51", "remaining_time": "3:51:44"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 4.920639640988697e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:13:45", "remaining_time": "3:52:44"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 4.920639640988697e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:09:53", "remaining_time": "3:51:45"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 4.920639640988697e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:09:52", "remaining_time": "3:51:45"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 4.854601708542747e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:11:28", "remaining_time": "3:50:07"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 4.854601708542747e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:15:22", "remaining_time": "3:51:07"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 4.854601708542747e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:11:29", "remaining_time": "3:50:08"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 4.854601708542747e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:11:30", "remaining_time": "3:50:08"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7819, "reward": null, "learning_rate": 4.7889622257990205e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "15:13:04", "remaining_time": "3:48:30"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7819, "reward": null, "learning_rate": 4.7889622257990205e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "15:16:58", "remaining_time": "3:49:29"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7819, "reward": null, "learning_rate": 4.7889622257990205e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "15:13:04", "remaining_time": "3:48:30"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7819, "reward": null, "learning_rate": 4.7889622257990205e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "15:13:05", "remaining_time": "3:48:30"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 4.7237224910208935e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "15:14:39", "remaining_time": "3:46:53"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 4.7237224910208935e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "15:14:38", "remaining_time": "3:46:53"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 4.7237224910208935e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "15:14:40", "remaining_time": "3:46:53"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 4.7237224910208935e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "15:18:33", "remaining_time": "3:47:51"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 4.658883794565208e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "15:16:16", "remaining_time": "3:45:16"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 4.658883794565208e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "15:16:17", "remaining_time": "3:45:16"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 4.658883794565208e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "15:20:11", "remaining_time": "3:46:14"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 4.658883794565208e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "15:16:18", "remaining_time": "3:45:16"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 4.594447418856823e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "15:17:54", "remaining_time": "3:43:39"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 4.594447418856823e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "15:17:56", "remaining_time": "3:43:40"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 4.594447418856823e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "15:21:49", "remaining_time": "3:44:36"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 4.594447418856823e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "15:17:55", "remaining_time": "3:43:39"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 4.530414638363201e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "15:19:32", "remaining_time": "3:42:02"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 4.530414638363201e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "15:19:33", "remaining_time": "3:42:03"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 4.530414638363201e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "15:23:26", "remaining_time": "3:42:59"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 4.530414638363201e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "15:19:32", "remaining_time": "3:42:02"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 4.466786719569221e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "15:25:02", "remaining_time": "3:41:21"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 4.466786719569221e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "15:21:08", "remaining_time": "3:40:25"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 4.466786719569221e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "15:21:09", "remaining_time": "3:40:25"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 4.466786719569221e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "15:21:07", "remaining_time": "3:40:25"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 4.403564920952116e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "15:26:33", "remaining_time": "3:39:42"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 4.403564920952116e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "15:22:40", "remaining_time": "3:38:47"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 4.403564920952116e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "15:22:39", "remaining_time": "3:38:47"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 4.403564920952116e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "15:22:38", "remaining_time": "3:38:47"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.3407504929566166e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "15:24:16", "remaining_time": "3:37:10"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.3407504929566166e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "15:24:15", "remaining_time": "3:37:10"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.3407504929566166e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "15:24:17", "remaining_time": "3:37:10"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.3407504929566166e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "15:28:10", "remaining_time": "3:38:05"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 4.278344677970167e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "15:25:52", "remaining_time": "3:35:33"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 4.278344677970167e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "15:29:47", "remaining_time": "3:36:27"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 4.278344677970167e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "15:25:54", "remaining_time": "3:35:33"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 4.278344677970167e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "15:25:53", "remaining_time": "3:35:33"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.774, "reward": null, "learning_rate": 4.216348710298401e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "15:27:33", "remaining_time": "3:33:57"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.774, "reward": null, "learning_rate": 4.216348710298401e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "15:31:28", "remaining_time": "3:34:51"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.774, "reward": null, "learning_rate": 4.216348710298401e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "15:27:34", "remaining_time": "3:33:57"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.774, "reward": null, "learning_rate": 4.216348710298401e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "15:27:35", "remaining_time": "3:33:57"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 4.154763816140686e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "15:29:08", "remaining_time": "3:32:19"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 4.154763816140686e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "15:29:07", "remaining_time": "3:32:19"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 4.154763816140686e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "15:33:02", "remaining_time": "3:33:13"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 4.154763816140686e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "15:29:09", "remaining_time": "3:32:19"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 4.093591213565914e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "15:34:37", "remaining_time": "3:31:35"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 4.093591213565914e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "15:30:44", "remaining_time": "3:30:42"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 4.093591213565914e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "15:30:43", "remaining_time": "3:30:42"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 4.093591213565914e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "15:30:43", "remaining_time": "3:30:42"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 4.032832112488369e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "15:32:22", "remaining_time": "3:29:05"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 4.032832112488369e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "15:32:21", "remaining_time": "3:29:05"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 4.032832112488369e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "15:36:15", "remaining_time": "3:29:58"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 4.032832112488369e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "15:32:23", "remaining_time": "3:29:05"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7722, "reward": null, "learning_rate": 3.972487714643822e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "15:33:57", "remaining_time": "3:27:28"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7722, "reward": null, "learning_rate": 3.972487714643822e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "15:37:51", "remaining_time": "3:28:20"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7722, "reward": null, "learning_rate": 3.972487714643822e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "15:33:58", "remaining_time": "3:27:28"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7722, "reward": null, "learning_rate": 3.972487714643822e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "15:33:56", "remaining_time": "3:27:28"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 3.9125592135657475e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "15:35:32", "remaining_time": "3:25:51"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 3.9125592135657475e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "15:35:33", "remaining_time": "3:25:51"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 3.9125592135657475e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "15:35:34", "remaining_time": "3:25:51"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7689, "reward": null, "learning_rate": 3.9125592135657475e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "15:39:27", "remaining_time": "3:26:42"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.788, "reward": null, "learning_rate": 3.853047794561743e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "15:37:09", "remaining_time": "3:24:14"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.788, "reward": null, "learning_rate": 3.853047794561743e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "15:37:10", "remaining_time": "3:24:14"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.788, "reward": null, "learning_rate": 3.853047794561743e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "15:37:08", "remaining_time": "3:24:13"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.788, "reward": null, "learning_rate": 3.853047794561743e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "15:41:03", "remaining_time": "3:25:05"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 3.7939546346900417e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "15:38:45", "remaining_time": "3:22:37"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 3.7939546346900417e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "15:42:39", "remaining_time": "3:23:27"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 3.7939546346900417e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "15:38:46", "remaining_time": "3:22:37"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7705, "reward": null, "learning_rate": 3.7939546346900417e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "15:38:45", "remaining_time": "3:22:36"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7591, "reward": null, "learning_rate": 3.7352809027362796e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "15:44:19", "remaining_time": "3:21:50"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7591, "reward": null, "learning_rate": 3.7352809027362796e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "15:40:26", "remaining_time": "3:21:00"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7591, "reward": null, "learning_rate": 3.7352809027362796e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "15:40:25", "remaining_time": "3:21:00"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7591, "reward": null, "learning_rate": 3.7352809027362796e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "15:40:24", "remaining_time": "3:21:00"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7587, "reward": null, "learning_rate": 3.6770277591903462e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "15:42:02", "remaining_time": "3:19:23"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7587, "reward": null, "learning_rate": 3.6770277591903462e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "15:42:03", "remaining_time": "3:19:24"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7587, "reward": null, "learning_rate": 3.6770277591903462e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "15:45:56", "remaining_time": "3:20:13"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7587, "reward": null, "learning_rate": 3.6770277591903462e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "15:42:02", "remaining_time": "3:19:23"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 3.619196356223439e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "15:43:38", "remaining_time": "3:17:46"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 3.619196356223439e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "15:47:32", "remaining_time": "3:18:35"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 3.619196356223439e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "15:43:39", "remaining_time": "3:17:46"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.7782, "reward": null, "learning_rate": 3.619196356223439e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "15:43:39", "remaining_time": "3:17:46"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7811, "reward": null, "learning_rate": 3.5617878376652785e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "15:45:10", "remaining_time": "3:16:08"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7811, "reward": null, "learning_rate": 3.5617878376652785e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "15:45:12", "remaining_time": "3:16:09"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7811, "reward": null, "learning_rate": 3.5617878376652785e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "15:45:11", "remaining_time": "3:16:08"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7811, "reward": null, "learning_rate": 3.5617878376652785e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "15:49:05", "remaining_time": "3:16:57"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 3.504803338981472e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "15:50:40", "remaining_time": "3:15:19"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 3.504803338981472e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "15:46:46", "remaining_time": "3:14:31"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 3.504803338981472e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "15:46:47", "remaining_time": "3:14:31"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 3.504803338981472e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "15:46:45", "remaining_time": "3:14:31"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 3.448243987251093e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "15:48:25", "remaining_time": "3:12:55"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 3.448243987251093e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "15:48:26", "remaining_time": "3:12:55"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 3.448243987251093e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "15:48:27", "remaining_time": "3:12:55"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 3.448243987251093e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "15:52:20", "remaining_time": "3:13:42"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 3.3921109011443354e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "15:50:06", "remaining_time": "3:11:18"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 3.3921109011443354e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "15:53:59", "remaining_time": "3:12:05"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 3.3921109011443354e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "15:50:05", "remaining_time": "3:11:18"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 3.3921109011443354e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "15:50:06", "remaining_time": "3:11:18"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 3.336405190900438e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "15:51:43", "remaining_time": "3:09:41"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 3.336405190900438e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "15:55:38", "remaining_time": "3:10:28"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 3.336405190900438e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "15:51:44", "remaining_time": "3:09:42"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 3.336405190900438e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "15:51:45", "remaining_time": "3:09:42"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 3.2811279583056825e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "15:53:21", "remaining_time": "3:08:05"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 3.2811279583056825e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "15:53:22", "remaining_time": "3:08:05"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 3.2811279583056825e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "15:53:23", "remaining_time": "3:08:05"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 3.2811279583056825e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "15:57:16", "remaining_time": "3:08:51"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 3.2262802966716383e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "15:58:53", "remaining_time": "3:07:14"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 3.2262802966716383e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "15:54:59", "remaining_time": "3:06:28"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 3.2262802966716383e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "15:55:00", "remaining_time": "3:06:28"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 3.2262802966716383e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "15:55:00", "remaining_time": "3:06:28"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.171863290813509e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "15:56:42", "remaining_time": "3:04:52"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.171863290813509e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "15:56:42", "remaining_time": "3:04:52"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.171863290813509e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "16:00:35", "remaining_time": "3:05:37"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 3.171863290813509e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "15:56:41", "remaining_time": "3:04:52"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7634, "reward": null, "learning_rate": 3.117878017028697e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "15:58:17", "remaining_time": "3:03:15"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7634, "reward": null, "learning_rate": 3.117878017028697e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "15:58:16", "remaining_time": "3:03:15"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7634, "reward": null, "learning_rate": 3.117878017028697e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "16:02:11", "remaining_time": "3:04:00"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7634, "reward": null, "learning_rate": 3.117878017028697e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "15:58:18", "remaining_time": "3:03:15"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 3.064325543075494e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "15:59:54", "remaining_time": "3:01:38"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 3.064325543075494e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "15:59:55", "remaining_time": "3:01:38"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 3.064325543075494e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "15:59:56", "remaining_time": "3:01:38"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 3.064325543075494e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "16:03:49", "remaining_time": "3:02:22"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 3.0112069281519994e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:01:30", "remaining_time": "3:00:01"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 3.0112069281519994e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:01:31", "remaining_time": "3:00:01"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 3.0112069281519994e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:05:24", "remaining_time": "3:00:44"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 3.0112069281519994e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:01:29", "remaining_time": "3:00:01"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 2.9585232228751204e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:03:08", "remaining_time": "2:58:24"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 2.9585232228751204e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:07:03", "remaining_time": "2:59:07"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 2.9585232228751204e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:03:10", "remaining_time": "2:58:24"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 2.9585232228751204e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:03:09", "remaining_time": "2:58:24"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 2.906275469259839e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:04:48", "remaining_time": "2:56:47"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 2.906275469259839e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:04:49", "remaining_time": "2:56:48"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 2.906275469259839e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:04:49", "remaining_time": "2:56:48"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7725, "reward": null, "learning_rate": 2.906275469259839e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:08:42", "remaining_time": "2:57:30"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 2.8544647006985724e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:06:25", "remaining_time": "2:55:11"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 2.8544647006985724e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:06:27", "remaining_time": "2:55:11"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 2.8544647006985724e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:06:26", "remaining_time": "2:55:11"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7913, "reward": null, "learning_rate": 2.8544647006985724e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:10:20", "remaining_time": "2:55:53"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.803091941940747e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:11:54", "remaining_time": "2:54:15"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.803091941940747e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:08:01", "remaining_time": "2:53:33"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.803091941940747e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:08:02", "remaining_time": "2:53:34"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.803091941940747e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:08:00", "remaining_time": "2:53:33"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.752158209072522e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "16:09:44", "remaining_time": "2:51:58"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.752158209072522e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "16:09:42", "remaining_time": "2:51:57"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.752158209072522e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "16:09:43", "remaining_time": "2:51:57"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.752158209072522e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "16:13:37", "remaining_time": "2:52:39"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.701664509496701e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "16:11:20", "remaining_time": "2:50:20"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.701664509496701e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "16:11:19", "remaining_time": "2:50:20"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.701664509496701e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "16:15:14", "remaining_time": "2:51:01"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.701664509496701e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "16:11:21", "remaining_time": "2:50:21"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.651611841912796e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "16:13:00", "remaining_time": "2:48:44"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.651611841912796e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "16:12:59", "remaining_time": "2:48:44"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.651611841912796e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "16:16:53", "remaining_time": "2:49:24"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.651611841912796e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "16:12:58", "remaining_time": "2:48:44"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 2.602001196297299e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "16:14:35", "remaining_time": "2:47:07"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 2.602001196297299e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "16:14:36", "remaining_time": "2:47:07"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 2.602001196297299e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "16:14:37", "remaining_time": "2:47:07"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 2.602001196297299e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "16:18:30", "remaining_time": "2:47:47"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 2.5528335538840597e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "16:16:14", "remaining_time": "2:45:30"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 2.5528335538840597e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "16:20:07", "remaining_time": "2:46:09"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 2.5528335538840597e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "16:16:13", "remaining_time": "2:45:30"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 2.5528335538840597e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "16:16:12", "remaining_time": "2:45:30"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 2.5041098871449204e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "16:17:45", "remaining_time": "2:43:52"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 2.5041098871449204e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "16:17:46", "remaining_time": "2:43:52"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 2.5041098871449204e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "16:17:46", "remaining_time": "2:43:52"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 2.5041098871449204e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "16:21:39", "remaining_time": "2:44:31"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 2.4558311597704636e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "16:19:20", "remaining_time": "2:42:15"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 2.4558311597704636e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "16:19:22", "remaining_time": "2:42:15"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 2.4558311597704636e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "16:19:21", "remaining_time": "2:42:15"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 2.4558311597704636e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "16:23:15", "remaining_time": "2:42:54"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.772, "reward": null, "learning_rate": 2.40799832665094e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "16:20:58", "remaining_time": "2:40:38"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.772, "reward": null, "learning_rate": 2.40799832665094e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "16:24:53", "remaining_time": "2:41:16"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.772, "reward": null, "learning_rate": 2.40799832665094e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "16:21:00", "remaining_time": "2:40:38"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.772, "reward": null, "learning_rate": 2.40799832665094e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "16:20:59", "remaining_time": "2:40:38"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "16:26:29", "remaining_time": "2:39:39"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "16:22:35", "remaining_time": "2:39:01"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "16:22:36", "remaining_time": "2:39:01"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7742, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "16:22:34", "remaining_time": "2:39:01"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "16:24:07", "remaining_time": "2:37:23"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "16:28:02", "remaining_time": "2:38:01"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "16:24:09", "remaining_time": "2:37:24"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "16:24:08", "remaining_time": "2:37:23"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.785, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "16:29:40", "remaining_time": "2:36:24"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.785, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "16:25:45", "remaining_time": "2:35:47"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.785, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "16:25:47", "remaining_time": "2:35:47"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.785, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "16:25:46", "remaining_time": "2:35:47"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "16:27:26", "remaining_time": "2:34:10"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "16:27:27", "remaining_time": "2:34:10"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "16:27:28", "remaining_time": "2:34:10"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7846, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "16:31:20", "remaining_time": "2:34:47"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "16:33:00", "remaining_time": "2:33:10"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "16:29:06", "remaining_time": "2:32:34"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "16:29:07", "remaining_time": "2:32:34"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "16:29:05", "remaining_time": "2:32:33"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "16:30:43", "remaining_time": "2:30:57"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "16:30:42", "remaining_time": "2:30:57"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "16:30:44", "remaining_time": "2:30:57"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7936, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "16:34:37", "remaining_time": "2:31:32"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "16:32:18", "remaining_time": "2:29:19"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "16:32:17", "remaining_time": "2:29:19"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "16:32:19", "remaining_time": "2:29:19"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7785, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "16:36:12", "remaining_time": "2:29:55"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "16:37:47", "remaining_time": "2:28:17"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "16:33:54", "remaining_time": "2:27:42"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "16:33:53", "remaining_time": "2:27:42"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "16:33:52", "remaining_time": "2:27:42"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "16:35:29", "remaining_time": "2:26:05"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "16:39:24", "remaining_time": "2:26:39"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "16:35:31", "remaining_time": "2:26:05"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7624, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "16:35:30", "remaining_time": "2:26:05"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7682, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "16:37:05", "remaining_time": "2:24:28"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7682, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "16:41:00", "remaining_time": "2:25:02"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7682, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "16:37:07", "remaining_time": "2:24:28"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7682, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "16:37:06", "remaining_time": "2:24:28"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "16:42:38", "remaining_time": "2:23:25"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "16:38:43", "remaining_time": "2:22:51"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "16:38:44", "remaining_time": "2:22:51"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "16:38:45", "remaining_time": "2:22:51"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "16:40:18", "remaining_time": "2:21:14"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "16:40:18", "remaining_time": "2:21:14"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "16:44:12", "remaining_time": "2:21:47"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "16:40:19", "remaining_time": "2:21:14"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "16:45:53", "remaining_time": "2:20:10"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "16:41:59", "remaining_time": "2:19:37"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "16:41:58", "remaining_time": "2:19:37"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "16:42:00", "remaining_time": "2:19:38"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "16:43:35", "remaining_time": "2:18:00"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "16:43:36", "remaining_time": "2:18:01"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "16:43:36", "remaining_time": "2:18:00"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "16:47:29", "remaining_time": "2:18:33"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7804, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "16:49:10", "remaining_time": "2:16:56"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7804, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "16:45:16", "remaining_time": "2:16:24"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7804, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "16:45:17", "remaining_time": "2:16:24"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7804, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "16:45:15", "remaining_time": "2:16:24"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "16:46:55", "remaining_time": "2:14:47"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "16:46:55", "remaining_time": "2:14:47"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "16:50:48", "remaining_time": "2:15:18"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "16:46:54", "remaining_time": "2:14:47"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "16:48:29", "remaining_time": "2:13:10"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "16:48:31", "remaining_time": "2:13:10"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "16:48:30", "remaining_time": "2:13:10"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "16:52:24", "remaining_time": "2:13:41"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "16:50:09", "remaining_time": "2:11:33"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "16:54:04", "remaining_time": "2:12:04"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "16:50:11", "remaining_time": "2:11:34"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "16:50:10", "remaining_time": "2:11:33"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7949, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "16:51:49", "remaining_time": "2:09:57"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7949, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "16:55:42", "remaining_time": "2:10:27"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7949, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "16:51:48", "remaining_time": "2:09:57"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7949, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "16:51:49", "remaining_time": "2:09:57"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "16:53:24", "remaining_time": "2:08:19"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "16:57:19", "remaining_time": "2:08:49"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "16:53:25", "remaining_time": "2:08:20"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7702, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "16:53:26", "remaining_time": "2:08:20"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "16:55:03", "remaining_time": "2:06:43"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "16:55:05", "remaining_time": "2:06:43"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "16:58:58", "remaining_time": "2:07:12"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "16:55:04", "remaining_time": "2:06:43"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "17:00:34", "remaining_time": "2:05:35"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "16:56:40", "remaining_time": "2:05:06"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "16:56:41", "remaining_time": "2:05:06"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7807, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "16:56:40", "remaining_time": "2:05:06"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "16:58:16", "remaining_time": "2:03:29"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "17:02:10", "remaining_time": "2:03:57"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "16:58:17", "remaining_time": "2:03:29"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "16:58:15", "remaining_time": "2:03:29"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "16:59:53", "remaining_time": "2:01:52"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "16:59:54", "remaining_time": "2:01:52"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "16:59:55", "remaining_time": "2:01:52"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "17:03:48", "remaining_time": "2:02:20"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:01:30", "remaining_time": "2:00:15"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:05:24", "remaining_time": "2:00:42"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:01:31", "remaining_time": "2:00:15"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7755, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:01:31", "remaining_time": "2:00:15"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:03:04", "remaining_time": "1:58:37"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:06:58", "remaining_time": "1:59:05"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:03:05", "remaining_time": "1:58:38"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:03:03", "remaining_time": "1:58:37"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7679, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:08:32", "remaining_time": "1:57:27"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7679, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:04:39", "remaining_time": "1:57:00"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7679, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:04:38", "remaining_time": "1:57:00"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7679, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:04:37", "remaining_time": "1:57:00"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "17:06:17", "remaining_time": "1:55:23"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "17:10:11", "remaining_time": "1:55:50"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "17:06:17", "remaining_time": "1:55:23"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "17:06:18", "remaining_time": "1:55:23"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "17:07:54", "remaining_time": "1:53:46"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "17:11:48", "remaining_time": "1:54:12"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "17:07:55", "remaining_time": "1:53:46"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.78, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "17:07:54", "remaining_time": "1:53:46"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "17:09:33", "remaining_time": "1:52:10"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "17:13:27", "remaining_time": "1:52:35"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "17:09:32", "remaining_time": "1:52:10"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "17:09:34", "remaining_time": "1:52:10"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7799, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "17:11:08", "remaining_time": "1:50:32"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7799, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "17:15:03", "remaining_time": "1:50:58"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7799, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "17:11:10", "remaining_time": "1:50:33"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7799, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "17:11:09", "remaining_time": "1:50:33"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "17:16:45", "remaining_time": "1:49:21"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "17:12:50", "remaining_time": "1:48:56"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "17:12:52", "remaining_time": "1:48:56"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "17:12:51", "remaining_time": "1:48:56"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "17:14:31", "remaining_time": "1:47:19"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "17:18:24", "remaining_time": "1:47:44"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "17:14:29", "remaining_time": "1:47:19"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "17:14:30", "remaining_time": "1:47:19"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "17:16:05", "remaining_time": "1:45:42"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "17:20:00", "remaining_time": "1:46:06"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "17:16:07", "remaining_time": "1:45:42"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "17:16:06", "remaining_time": "1:45:42"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7758, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "17:17:48", "remaining_time": "1:44:06"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7758, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "17:21:42", "remaining_time": "1:44:29"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7758, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "17:17:49", "remaining_time": "1:44:06"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7758, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "17:17:47", "remaining_time": "1:44:06"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "17:19:20", "remaining_time": "1:42:28"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "17:23:15", "remaining_time": "1:42:51"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "17:19:22", "remaining_time": "1:42:28"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "17:19:21", "remaining_time": "1:42:28"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "17:20:57", "remaining_time": "1:40:51"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "17:24:52", "remaining_time": "1:41:14"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "17:20:59", "remaining_time": "1:40:51"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "17:20:58", "remaining_time": "1:40:51"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7895, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "17:22:40", "remaining_time": "1:39:15"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7895, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "17:26:33", "remaining_time": "1:39:37"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7895, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "17:22:39", "remaining_time": "1:39:15"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7895, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "17:22:38", "remaining_time": "1:39:15"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "17:24:14", "remaining_time": "1:37:38"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "17:24:15", "remaining_time": "1:37:38"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "17:28:08", "remaining_time": "1:37:59"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "17:24:13", "remaining_time": "1:37:38"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "17:25:50", "remaining_time": "1:36:00"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "17:29:44", "remaining_time": "1:36:22"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "17:25:50", "remaining_time": "1:36:01"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "17:25:51", "remaining_time": "1:36:01"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "17:27:29", "remaining_time": "1:34:24"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "17:31:24", "remaining_time": "1:34:45"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "17:27:31", "remaining_time": "1:34:24"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "17:27:30", "remaining_time": "1:34:24"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "17:29:05", "remaining_time": "1:32:47"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "17:32:58", "remaining_time": "1:33:07"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "17:29:04", "remaining_time": "1:32:47"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "17:29:04", "remaining_time": "1:32:47"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "17:30:43", "remaining_time": "1:31:10"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "17:34:38", "remaining_time": "1:31:30"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "17:30:45", "remaining_time": "1:31:10"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "17:30:44", "remaining_time": "1:31:10"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "17:36:15", "remaining_time": "1:29:53"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "17:32:22", "remaining_time": "1:29:33"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "17:32:22", "remaining_time": "1:29:33"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "17:32:21", "remaining_time": "1:29:33"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "17:33:58", "remaining_time": "1:27:56"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "17:37:52", "remaining_time": "1:28:15"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "17:33:59", "remaining_time": "1:27:56"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7837, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "17:33:57", "remaining_time": "1:27:56"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7697, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "17:35:33", "remaining_time": "1:26:19"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7697, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "17:39:25", "remaining_time": "1:26:38"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7697, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "17:35:32", "remaining_time": "1:26:19"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7697, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "17:35:31", "remaining_time": "1:26:19"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "17:37:08", "remaining_time": "1:24:42"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "17:41:03", "remaining_time": "1:25:00"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "17:37:10", "remaining_time": "1:24:42"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "17:37:09", "remaining_time": "1:24:42"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "17:38:46", "remaining_time": "1:23:05"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "17:42:40", "remaining_time": "1:23:23"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "17:38:47", "remaining_time": "1:23:05"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "17:38:47", "remaining_time": "1:23:05"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "17:40:22", "remaining_time": "1:21:28"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "17:40:22", "remaining_time": "1:21:28"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "17:44:16", "remaining_time": "1:21:46"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.7745, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "17:40:23", "remaining_time": "1:21:28"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "17:42:00", "remaining_time": "1:19:51"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "17:42:01", "remaining_time": "1:19:51"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "17:42:01", "remaining_time": "1:19:51"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "17:45:54", "remaining_time": "1:20:08"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "17:43:37", "remaining_time": "1:18:14"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "17:43:39", "remaining_time": "1:18:14"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "17:43:38", "remaining_time": "1:18:14"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "17:47:32", "remaining_time": "1:18:31"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "17:45:15", "remaining_time": "1:16:37"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "17:45:13", "remaining_time": "1:16:37"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "17:49:08", "remaining_time": "1:16:54"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "17:45:14", "remaining_time": "1:16:37"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7793, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "17:46:53", "remaining_time": "1:15:00"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7793, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "17:46:55", "remaining_time": "1:15:00"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7793, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "17:46:54", "remaining_time": "1:15:00"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7793, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "17:50:48", "remaining_time": "1:15:16"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "17:48:27", "remaining_time": "1:13:23"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "17:48:28", "remaining_time": "1:13:23"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "17:48:26", "remaining_time": "1:13:23"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "17:52:21", "remaining_time": "1:13:39"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "17:50:05", "remaining_time": "1:11:46"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "17:53:59", "remaining_time": "1:12:01"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "17:50:06", "remaining_time": "1:11:46"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "17:50:06", "remaining_time": "1:11:46"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "17:51:42", "remaining_time": "1:10:09"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "17:55:36", "remaining_time": "1:10:24"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "17:51:43", "remaining_time": "1:10:09"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7677, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "17:51:43", "remaining_time": "1:10:09"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "17:53:19", "remaining_time": "1:08:32"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "17:53:21", "remaining_time": "1:08:32"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "17:53:20", "remaining_time": "1:08:32"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "17:57:14", "remaining_time": "1:08:47"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "17:54:54", "remaining_time": "1:06:55"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "17:58:48", "remaining_time": "1:07:09"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "17:54:55", "remaining_time": "1:06:55"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "17:54:54", "remaining_time": "1:06:55"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7688, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "17:56:29", "remaining_time": "1:05:18"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7688, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "17:56:28", "remaining_time": "1:05:17"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7688, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "17:56:27", "remaining_time": "1:05:17"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7688, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "18:00:22", "remaining_time": "1:05:32"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "17:58:04", "remaining_time": "1:03:40"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "18:01:59", "remaining_time": "1:03:54"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "17:58:05", "remaining_time": "1:03:41"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "17:58:06", "remaining_time": "1:03:41"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.762, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "17:59:46", "remaining_time": "1:02:04"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.762, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "17:59:45", "remaining_time": "1:02:04"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.762, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "18:03:40", "remaining_time": "1:02:17"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.762, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "17:59:47", "remaining_time": "1:02:04"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:01:25", "remaining_time": "1:00:27"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:01:24", "remaining_time": "1:00:27"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:01:26", "remaining_time": "1:00:27"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7947, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:05:19", "remaining_time": "1:00:40"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:03:04", "remaining_time": "0:58:50"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:03:02", "remaining_time": "0:58:50"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:06:57", "remaining_time": "0:59:03"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:03:03", "remaining_time": "0:58:50"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "18:04:40", "remaining_time": "0:57:13"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "18:08:33", "remaining_time": "0:57:25"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "18:04:40", "remaining_time": "0:57:13"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7822, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "18:04:39", "remaining_time": "0:57:13"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "18:06:16", "remaining_time": "0:55:36"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "18:06:15", "remaining_time": "0:55:36"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "18:10:09", "remaining_time": "0:55:48"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7796, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "18:06:16", "remaining_time": "0:55:36"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "18:11:48", "remaining_time": "0:54:11"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "18:07:53", "remaining_time": "0:53:59"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "18:07:54", "remaining_time": "0:53:59"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "18:07:55", "remaining_time": "0:53:59"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "18:13:28", "remaining_time": "0:52:33"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "18:09:34", "remaining_time": "0:52:22"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "18:09:35", "remaining_time": "0:52:22"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7731, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "18:09:33", "remaining_time": "0:52:22"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "18:11:13", "remaining_time": "0:50:45"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "18:15:06", "remaining_time": "0:50:56"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "18:11:12", "remaining_time": "0:50:45"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7696, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "18:11:13", "remaining_time": "0:50:45"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "18:12:49", "remaining_time": "0:49:08"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "18:16:44", "remaining_time": "0:49:19"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "18:12:51", "remaining_time": "0:49:08"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "18:12:50", "remaining_time": "0:49:08"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "18:18:19", "remaining_time": "0:47:41"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "18:14:26", "remaining_time": "0:47:31"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "18:14:27", "remaining_time": "0:47:31"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "18:14:25", "remaining_time": "0:47:31"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "18:16:02", "remaining_time": "0:45:54"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "18:16:04", "remaining_time": "0:45:54"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "18:19:57", "remaining_time": "0:46:04"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "18:16:03", "remaining_time": "0:45:54"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "18:17:41", "remaining_time": "0:44:17"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "18:21:35", "remaining_time": "0:44:27"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "18:17:42", "remaining_time": "0:44:17"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7787, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "18:17:42", "remaining_time": "0:44:17"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "18:23:17", "remaining_time": "0:42:50"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "18:19:23", "remaining_time": "0:42:40"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "18:19:24", "remaining_time": "0:42:40"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.7886, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "18:19:23", "remaining_time": "0:42:40"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "18:21:00", "remaining_time": "0:41:03"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "18:24:53", "remaining_time": "0:41:12"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "18:21:01", "remaining_time": "0:41:03"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "18:20:59", "remaining_time": "0:41:03"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7577, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "18:22:35", "remaining_time": "0:39:26"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7577, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "18:22:36", "remaining_time": "0:39:26"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7577, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "18:22:37", "remaining_time": "0:39:26"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7577, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "18:26:30", "remaining_time": "0:39:35"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "18:24:13", "remaining_time": "0:37:49"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "18:24:15", "remaining_time": "0:37:49"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "18:28:08", "remaining_time": "0:37:57"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "18:24:14", "remaining_time": "0:37:49"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.7588, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "18:25:50", "remaining_time": "0:36:12"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.7588, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "18:29:45", "remaining_time": "0:36:20"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.7588, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "18:25:52", "remaining_time": "0:36:12"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.7588, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "18:25:51", "remaining_time": "0:36:12"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "18:31:23", "remaining_time": "0:34:43"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "18:27:30", "remaining_time": "0:34:35"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "18:27:29", "remaining_time": "0:34:35"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "18:27:28", "remaining_time": "0:34:35"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "18:32:58", "remaining_time": "0:33:05"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "18:29:03", "remaining_time": "0:32:58"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "18:29:05", "remaining_time": "0:32:58"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "18:29:04", "remaining_time": "0:32:58"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7628, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "18:30:41", "remaining_time": "0:31:21"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7628, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "18:30:43", "remaining_time": "0:31:21"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7628, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "18:30:42", "remaining_time": "0:31:21"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7628, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "18:34:36", "remaining_time": "0:31:28"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "18:32:21", "remaining_time": "0:29:44"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "18:36:16", "remaining_time": "0:29:51"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "18:32:23", "remaining_time": "0:29:45"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "18:32:22", "remaining_time": "0:29:44"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "18:33:59", "remaining_time": "0:28:07"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "18:34:00", "remaining_time": "0:28:07"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "18:34:00", "remaining_time": "0:28:07"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7889, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "18:37:53", "remaining_time": "0:28:13"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "18:35:37", "remaining_time": "0:26:30"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "18:35:38", "remaining_time": "0:26:31"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "18:35:39", "remaining_time": "0:26:31"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7842, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "18:39:32", "remaining_time": "0:26:36"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7673, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "18:37:17", "remaining_time": "0:24:54"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7673, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "18:41:11", "remaining_time": "0:24:59"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7673, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "18:37:19", "remaining_time": "0:24:54"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7673, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "18:37:18", "remaining_time": "0:24:54"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "18:38:59", "remaining_time": "0:23:17"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "18:42:52", "remaining_time": "0:23:21"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "18:38:59", "remaining_time": "0:23:17"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "18:38:58", "remaining_time": "0:23:17"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "18:40:36", "remaining_time": "0:21:40"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "18:40:36", "remaining_time": "0:21:40"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "18:44:29", "remaining_time": "0:21:44"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "18:40:35", "remaining_time": "0:21:40"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7724, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "18:42:12", "remaining_time": "0:20:03"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7724, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "18:46:07", "remaining_time": "0:20:07"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7724, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "18:42:14", "remaining_time": "0:20:03"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7724, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "18:42:13", "remaining_time": "0:20:03"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "18:43:52", "remaining_time": "0:18:26"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "18:43:50", "remaining_time": "0:18:26"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "18:47:45", "remaining_time": "0:18:29"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7703, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "18:43:51", "remaining_time": "0:18:26"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7615, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "18:45:28", "remaining_time": "0:16:49"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7615, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "18:45:29", "remaining_time": "0:16:49"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7615, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "18:45:30", "remaining_time": "0:16:49"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7615, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "18:49:23", "remaining_time": "0:16:52"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "18:47:02", "remaining_time": "0:15:11"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "18:47:03", "remaining_time": "0:15:11"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "18:50:56", "remaining_time": "0:15:15"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "18:47:03", "remaining_time": "0:15:12"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.764, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "18:52:38", "remaining_time": "0:13:37"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.764, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "18:48:44", "remaining_time": "0:13:35"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.764, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "18:48:45", "remaining_time": "0:13:35"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.764, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "18:48:44", "remaining_time": "0:13:35"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "18:54:17", "remaining_time": "0:12:00"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "18:50:24", "remaining_time": "0:11:58"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "18:50:23", "remaining_time": "0:11:58"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.773, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "18:50:23", "remaining_time": "0:11:58"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "18:52:05", "remaining_time": "0:10:21"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "18:55:59", "remaining_time": "0:10:23"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "18:52:07", "remaining_time": "0:10:21"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "18:52:06", "remaining_time": "0:10:21"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "18:53:43", "remaining_time": "0:08:44"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "18:53:44", "remaining_time": "0:08:44"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "18:57:37", "remaining_time": "0:08:45"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7781, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "18:53:44", "remaining_time": "0:08:44"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "18:59:15", "remaining_time": "0:07:08"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "18:55:20", "remaining_time": "0:07:06"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "18:55:21", "remaining_time": "0:07:06"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "18:55:22", "remaining_time": "0:07:06"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "18:56:58", "remaining_time": "0:05:29"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "18:56:57", "remaining_time": "0:05:29"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "19:00:52", "remaining_time": "0:05:31"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "18:56:59", "remaining_time": "0:05:29"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7674, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "18:58:34", "remaining_time": "0:03:52"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7674, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "19:02:29", "remaining_time": "0:03:53"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7674, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "18:58:35", "remaining_time": "0:03:52"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7674, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "18:58:36", "remaining_time": "0:03:52"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:00:10", "remaining_time": "0:02:15"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:00:09", "remaining_time": "0:02:15"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:04:04", "remaining_time": "0:02:16"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:00:11", "remaining_time": "0:02:15"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "19:01:48", "remaining_time": "0:00:38"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "19:05:41", "remaining_time": "0:00:38"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "19:01:47", "remaining_time": "0:00:38"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "19:01:48", "remaining_time": "0:00:38"} diff --git a/sft-lora/trainer_state.json b/sft-lora/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..4083c3c360cdcea113a6a1d0f052dce359b38b9c --- /dev/null +++ b/sft-lora/trainer_state.json @@ -0,0 +1,4261 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 2.0, + "global_step": 7064, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.293, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2584, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2075, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.1718, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1483, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.122, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.0971, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0756, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0673, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0705, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0673, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.031, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.0383, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0097, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.012, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9834, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 0.9908, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9908, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 0.9913, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9782, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 0.9954, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.975, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9687, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9677, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9715, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9692, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9627, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.9784, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.941, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9623, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9401, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9152, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9405, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9431, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9512, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9301, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.917, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9162, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9207, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.924, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9025, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9027, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9167, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9119, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9042, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9113, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9297, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9194, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.8978, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.9217, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.8997, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9045, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.8985, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9171, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.9001, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8824, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9046, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.8888, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.889, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.906, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8858, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.8862, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.8983, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.8967, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8925, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.883, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8823, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8937, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8695, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8873, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8862, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.874, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8834, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8744, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.876, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8874, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8938, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8855, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8827, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8736, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8907, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.862, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8796, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8745, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.8594, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8839, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8536, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8765, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8726, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8664, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8805, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.878, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8632, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8614, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.8629, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8635, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8525, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8592, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8621, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8687, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8524, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.8687, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8505, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8754, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8583, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.8698, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8661, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8574, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.852, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8619, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8632, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8529, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8529, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8465, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8604, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8649, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8572, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8634, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8478, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8475, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8537, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8499, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8467, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8538, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8619, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8593, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8484, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8395, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8547, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8586, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.839, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8417, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8404, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.843, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8557, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8504, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8579, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8563, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.8446, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.8524, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8417, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8582, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.841, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8529, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8545, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8471, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8379, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8542, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8463, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8362, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8467, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8501, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8541, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8443, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8297, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8532, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.854, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.849, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8516, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8394, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8399, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8242, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8395, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8355, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8299, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8272, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8336, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8264, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8381, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8278, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8458, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8348, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.814, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.838, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.824, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.8314, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.821, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8311, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8443, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8315, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8184, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8364, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.8186, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8454, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.832, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8027, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8365, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.8523, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8377, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8299, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8273, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.813, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8262, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8258, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8248, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8123, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8304, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.849, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8255, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8317, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8331, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8309, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8117, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8155, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8178, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8155, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.8273, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8021, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8374, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8173, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8227, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8275, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8226, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.815, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8306, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8424, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8051, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8117, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.8123, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8038, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8308, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8187, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8274, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8171, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8213, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8241, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8296, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8247, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8399, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8015, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.8204, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8198, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8045, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.8185, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8123, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8093, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8194, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8121, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.811, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8013, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8215, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.8079, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.821, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8097, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8046, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8112, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8099, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8148, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8105, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8132, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8149, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8306, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8106, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8192, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8129, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8155, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.8039, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8109, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8063, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8275, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8107, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8047, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8123, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8241, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.812, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8161, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.797, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8155, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.797, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8153, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8016, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8138, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8178, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8062, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8101, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.7982, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8021, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.817, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.8083, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8047, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8063, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8139, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.8075, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.8056, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8242, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.8041, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8088, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8121, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.8151, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8064, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8151, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7942, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8131, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8015, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8053, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.7986, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7936, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8235, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8083, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8081, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.7981, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8152, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.8091, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8206, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7947, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8116, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8135, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8032, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8023, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8116, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8048, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.8032, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.808, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8057, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8013, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.802, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.804, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.7983, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8083, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8203, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.792, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8006, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.7953, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8057, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8005, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8082, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.811, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.7981, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8018, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.7991, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8057, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8156, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8003, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.7976, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7894, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.7953, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8124, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8073, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.7979, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8023, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8046, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.8082, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7868, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.7938, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.8215, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.807, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7878, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.7968, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.787, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.8011, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8086, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8125, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8125, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7805, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.817, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8056, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7752, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7749, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8073, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.8117, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8008, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8028, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.7974, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7867, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8002, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8095, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7847, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7693, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8078, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7925, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.77, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7962, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.8014, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7934, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.7978, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8022, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7934, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.7975, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.807, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7754, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.7977, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7922, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7862, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7918, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.781, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7786, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8067, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7755, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7958, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8064, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.7967, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8107, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7857, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7732, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.7768, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7839, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7923, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.7994, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7907, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7908, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7731, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7769, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.795, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8147, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8065, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7879, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.7755, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7852, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7912, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7934, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.7966, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.7976, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7843, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7848, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7675, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8059, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7871, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.776, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7911, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7934, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7922, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.7931, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7926, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7881, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7842, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7807, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7926, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7878, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7843, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.7748, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.802, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7864, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.7884, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7832, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8039, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.7737, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7844, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7865, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.7983, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7851, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7798, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.79, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7694, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7874, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7878, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.7992, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8003, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7778, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.773, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7872, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.7977, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7792, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7792, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7836, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8005, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7937, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7692, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7926, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7725, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7936, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7776, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7785, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7735, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7925, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7846, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.7782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2696292959503922e-05, + "loss": 0.7888, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2599628708177253e-05, + "loss": 0.7898, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.250320972002072e-05, + "loss": 0.7956, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2407037902076168e-05, + "loss": 0.7735, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.23111151564967e-05, + "loss": 0.7842, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215443380509125e-05, + "loss": 0.7892, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2120024466376381e-05, + "loss": 0.7822, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2024860301360131e-05, + "loss": 0.7788, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1929952767683426e-05, + "loss": 0.7824, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1835303742493508e-05, + "loss": 0.7859, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1740915097824629e-05, + "loss": 0.7897, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.1646788700561085e-05, + "loss": 0.768, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1552926412400225e-05, + "loss": 0.7935, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1459330089815699e-05, + "loss": 0.7933, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.136600158402068e-05, + "loss": 0.7792, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1272942740931286e-05, + "loss": 0.7839, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1180155401130044e-05, + "loss": 0.7844, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.1087641399829527e-05, + "loss": 0.7753, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0995402566835997e-05, + "loss": 0.791, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.090344072651328e-05, + "loss": 0.7998, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0811757697746614e-05, + "loss": 0.7864, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0720355293906741e-05, + "loss": 0.7702, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0629235322813982e-05, + "loss": 0.7705, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0538399586702507e-05, + "loss": 0.7941, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0447849882184715e-05, + "loss": 0.7779, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.035758800021564e-05, + "loss": 0.7755, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0267615726057592e-05, + "loss": 0.7825, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0177934839244787e-05, + "loss": 0.7983, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0088547113548211e-05, + "loss": 0.773, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99945431694048e-06, + "loss": 0.7794, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.910658211560902e-06, + "loss": 0.7889, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.822160553680617e-06, + "loss": 0.7809, + "step": 5000 + }, + { + "epoch": 1.42, + "learning_rate": 9.733963093667889e-06, + "loss": 0.7624, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 9.646067575953419e-06, + "loss": 0.7787, + "step": 5020 + }, + { + "epoch": 1.42, + "learning_rate": 9.558475738995923e-06, + "loss": 0.775, + "step": 5030 + }, + { + "epoch": 1.43, + "learning_rate": 9.471189315247669e-06, + "loss": 0.7607, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 9.384210031120288e-06, + "loss": 0.7795, + "step": 5050 + }, + { + "epoch": 1.43, + "learning_rate": 9.297539606950564e-06, + "loss": 0.7933, + "step": 5060 + }, + { + "epoch": 1.44, + "learning_rate": 9.21117975696644e-06, + "loss": 0.7859, + "step": 5070 + }, + { + "epoch": 1.44, + "learning_rate": 9.1251321892531e-06, + "loss": 0.7772, + "step": 5080 + }, + { + "epoch": 1.44, + "learning_rate": 9.039398605719215e-06, + "loss": 0.7833, + "step": 5090 + }, + { + "epoch": 1.44, + "learning_rate": 8.953980702063233e-06, + "loss": 0.7784, + "step": 5100 + }, + { + "epoch": 1.45, + "learning_rate": 8.868880167739887e-06, + "loss": 0.7835, + "step": 5110 + }, + { + "epoch": 1.45, + "learning_rate": 8.784098685926734e-06, + "loss": 0.779, + "step": 5120 + }, + { + "epoch": 1.45, + "learning_rate": 8.699637933490917e-06, + "loss": 0.7953, + "step": 5130 + }, + { + "epoch": 1.46, + "learning_rate": 8.615499580955953e-06, + "loss": 0.773, + "step": 5140 + }, + { + "epoch": 1.46, + "learning_rate": 8.531685292468693e-06, + "loss": 0.7851, + "step": 5150 + }, + { + "epoch": 1.46, + "learning_rate": 8.448196725766471e-06, + "loss": 0.7903, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 8.365035532144217e-06, + "loss": 0.7822, + "step": 5170 + }, + { + "epoch": 1.47, + "learning_rate": 8.282203356421891e-06, + "loss": 0.7887, + "step": 5180 + }, + { + "epoch": 1.47, + "learning_rate": 8.199701836911877e-06, + "loss": 0.7972, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 8.117532605386632e-06, + "loss": 0.7781, + "step": 5200 + }, + { + "epoch": 1.48, + "learning_rate": 8.035697287046376e-06, + "loss": 0.7885, + "step": 5210 + }, + { + "epoch": 1.48, + "learning_rate": 7.954197500486968e-06, + "loss": 0.779, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 7.873034857667877e-06, + "loss": 0.779, + "step": 5230 + }, + { + "epoch": 1.48, + "learning_rate": 7.792210963880328e-06, + "loss": 0.7883, + "step": 5240 + }, + { + "epoch": 1.49, + "learning_rate": 7.711727417715509e-06, + "loss": 0.7677, + "step": 5250 + }, + { + "epoch": 1.49, + "learning_rate": 7.631585811032999e-06, + "loss": 0.7849, + "step": 5260 + }, + { + "epoch": 1.49, + "learning_rate": 7.551787728929236e-06, + "loss": 0.7707, + "step": 5270 + }, + { + "epoch": 1.49, + "learning_rate": 7.472334749706214e-06, + "loss": 0.7855, + "step": 5280 + }, + { + "epoch": 1.5, + "learning_rate": 7.393228444840228e-06, + "loss": 0.7601, + "step": 5290 + }, + { + "epoch": 1.5, + "learning_rate": 7.314470378950802e-06, + "loss": 0.7741, + "step": 5300 + }, + { + "epoch": 1.5, + "learning_rate": 7.23606210976975e-06, + "loss": 0.7733, + "step": 5310 + }, + { + "epoch": 1.51, + "learning_rate": 7.158005188110381e-06, + "loss": 0.7881, + "step": 5320 + }, + { + "epoch": 1.51, + "learning_rate": 7.080301157836783e-06, + "loss": 0.7761, + "step": 5330 + }, + { + "epoch": 1.51, + "learning_rate": 7.002951555833334e-06, + "loss": 0.7692, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 6.925957911974262e-06, + "loss": 0.7656, + "step": 5350 + }, + { + "epoch": 1.52, + "learning_rate": 6.849321749093432e-06, + "loss": 0.7754, + "step": 5360 + }, + { + "epoch": 1.52, + "learning_rate": 6.773044582954172e-06, + "loss": 0.7828, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 6.697127922219357e-06, + "loss": 0.779, + "step": 5380 + }, + { + "epoch": 1.53, + "learning_rate": 6.621573268421505e-06, + "loss": 0.7856, + "step": 5390 + }, + { + "epoch": 1.53, + "learning_rate": 6.546382115933117e-06, + "loss": 0.7908, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 6.47155595193713e-06, + "loss": 0.7899, + "step": 5410 + }, + { + "epoch": 1.53, + "learning_rate": 6.397096256397456e-06, + "loss": 0.7736, + "step": 5420 + }, + { + "epoch": 1.54, + "learning_rate": 6.323004502029767e-06, + "loss": 0.7788, + "step": 5430 + }, + { + "epoch": 1.54, + "learning_rate": 6.249282154272315e-06, + "loss": 0.7729, + "step": 5440 + }, + { + "epoch": 1.54, + "learning_rate": 6.175930671256991e-06, + "loss": 0.7706, + "step": 5450 + }, + { + "epoch": 1.55, + "learning_rate": 6.102951503780449e-06, + "loss": 0.7915, + "step": 5460 + }, + { + "epoch": 1.55, + "learning_rate": 6.030346095275438e-06, + "loss": 0.7893, + "step": 5470 + }, + { + "epoch": 1.55, + "learning_rate": 5.958115881782228e-06, + "loss": 0.7813, + "step": 5480 + }, + { + "epoch": 1.55, + "learning_rate": 5.886262291920244e-06, + "loss": 0.793, + "step": 5490 + }, + { + "epoch": 1.56, + "learning_rate": 5.81478674685976e-06, + "loss": 0.7801, + "step": 5500 + }, + { + "epoch": 1.56, + "learning_rate": 5.7436906602938435e-06, + "loss": 0.7878, + "step": 5510 + }, + { + "epoch": 1.56, + "learning_rate": 5.672975438410344e-06, + "loss": 0.7762, + "step": 5520 + }, + { + "epoch": 1.57, + "learning_rate": 5.602642479864129e-06, + "loss": 0.7775, + "step": 5530 + }, + { + "epoch": 1.57, + "learning_rate": 5.532693175749373e-06, + "loss": 0.7689, + "step": 5540 + }, + { + "epoch": 1.57, + "learning_rate": 5.463128909572077e-06, + "loss": 0.7755, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 5.393951057222685e-06, + "loss": 0.7878, + "step": 5560 + }, + { + "epoch": 1.58, + "learning_rate": 5.325160986948899e-06, + "loss": 0.7759, + "step": 5570 + }, + { + "epoch": 1.58, + "learning_rate": 5.256760059328572e-06, + "loss": 0.7698, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 5.188749627242851e-06, + "loss": 0.7853, + "step": 5590 + }, + { + "epoch": 1.59, + "learning_rate": 5.121131035849361e-06, + "loss": 0.7886, + "step": 5600 + }, + { + "epoch": 1.59, + "learning_rate": 5.053905622555657e-06, + "loss": 0.7869, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 4.987074716992724e-06, + "loss": 0.7882, + "step": 5620 + }, + { + "epoch": 1.59, + "learning_rate": 4.920639640988697e-06, + "loss": 0.7854, + "step": 5630 + }, + { + "epoch": 1.6, + "learning_rate": 4.854601708542747e-06, + "loss": 0.7807, + "step": 5640 + }, + { + "epoch": 1.6, + "learning_rate": 4.7889622257990205e-06, + "loss": 0.7819, + "step": 5650 + }, + { + "epoch": 1.6, + "learning_rate": 4.7237224910208935e-06, + "loss": 0.7755, + "step": 5660 + }, + { + "epoch": 1.61, + "learning_rate": 4.658883794565208e-06, + "loss": 0.7829, + "step": 5670 + }, + { + "epoch": 1.61, + "learning_rate": 4.594447418856823e-06, + "loss": 0.7761, + "step": 5680 + }, + { + "epoch": 1.61, + "learning_rate": 4.530414638363201e-06, + "loss": 0.7742, + "step": 5690 + }, + { + "epoch": 1.61, + "learning_rate": 4.466786719569221e-06, + "loss": 0.7744, + "step": 5700 + }, + { + "epoch": 1.62, + "learning_rate": 4.403564920952116e-06, + "loss": 0.78, + "step": 5710 + }, + { + "epoch": 1.62, + "learning_rate": 4.3407504929566166e-06, + "loss": 0.7847, + "step": 5720 + }, + { + "epoch": 1.62, + "learning_rate": 4.278344677970167e-06, + "loss": 0.7837, + "step": 5730 + }, + { + "epoch": 1.63, + "learning_rate": 4.216348710298401e-06, + "loss": 0.774, + "step": 5740 + }, + { + "epoch": 1.63, + "learning_rate": 4.154763816140686e-06, + "loss": 0.7826, + "step": 5750 + }, + { + "epoch": 1.63, + "learning_rate": 4.093591213565914e-06, + "loss": 0.7881, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 4.032832112488369e-06, + "loss": 0.7878, + "step": 5770 + }, + { + "epoch": 1.64, + "learning_rate": 3.972487714643822e-06, + "loss": 0.7722, + "step": 5780 + }, + { + "epoch": 1.64, + "learning_rate": 3.9125592135657475e-06, + "loss": 0.7689, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.853047794561743e-06, + "loss": 0.788, + "step": 5800 + }, + { + "epoch": 1.64, + "learning_rate": 3.7939546346900417e-06, + "loss": 0.7705, + "step": 5810 + }, + { + "epoch": 1.65, + "learning_rate": 3.7352809027362796e-06, + "loss": 0.7591, + "step": 5820 + }, + { + "epoch": 1.65, + "learning_rate": 3.6770277591903462e-06, + "loss": 0.7587, + "step": 5830 + }, + { + "epoch": 1.65, + "learning_rate": 3.619196356223439e-06, + "loss": 0.7782, + "step": 5840 + }, + { + "epoch": 1.66, + "learning_rate": 3.5617878376652785e-06, + "loss": 0.7811, + "step": 5850 + }, + { + "epoch": 1.66, + "learning_rate": 3.504803338981472e-06, + "loss": 0.786, + "step": 5860 + }, + { + "epoch": 1.66, + "learning_rate": 3.448243987251093e-06, + "loss": 0.7911, + "step": 5870 + }, + { + "epoch": 1.66, + "learning_rate": 3.3921109011443354e-06, + "loss": 0.7706, + "step": 5880 + }, + { + "epoch": 1.67, + "learning_rate": 3.336405190900438e-06, + "loss": 0.7913, + "step": 5890 + }, + { + "epoch": 1.67, + "learning_rate": 3.2811279583056825e-06, + "loss": 0.7849, + "step": 5900 + }, + { + "epoch": 1.67, + "learning_rate": 3.2262802966716383e-06, + "loss": 0.7759, + "step": 5910 + }, + { + "epoch": 1.68, + "learning_rate": 3.171863290813509e-06, + "loss": 0.8093, + "step": 5920 + }, + { + "epoch": 1.68, + "learning_rate": 3.117878017028697e-06, + "loss": 0.7634, + "step": 5930 + }, + { + "epoch": 1.68, + "learning_rate": 3.064325543075494e-06, + "loss": 0.777, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.0112069281519994e-06, + "loss": 0.7794, + "step": 5950 + }, + { + "epoch": 1.69, + "learning_rate": 2.9585232228751204e-06, + "loss": 0.7703, + "step": 5960 + }, + { + "epoch": 1.69, + "learning_rate": 2.906275469259839e-06, + "loss": 0.7725, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 2.8544647006985724e-06, + "loss": 0.7913, + "step": 5980 + }, + { + "epoch": 1.7, + "learning_rate": 2.803091941940747e-06, + "loss": 0.7897, + "step": 5990 + }, + { + "epoch": 1.7, + "learning_rate": 2.752158209072522e-06, + "loss": 0.7785, + "step": 6000 + }, + { + "epoch": 1.7, + "learning_rate": 2.701664509496701e-06, + "loss": 0.7742, + "step": 6010 + }, + { + "epoch": 1.7, + "learning_rate": 2.651611841912796e-06, + "loss": 0.7742, + "step": 6020 + }, + { + "epoch": 1.71, + "learning_rate": 2.602001196297299e-06, + "loss": 0.7947, + "step": 6030 + }, + { + "epoch": 1.71, + "learning_rate": 2.5528335538840597e-06, + "loss": 0.7842, + "step": 6040 + }, + { + "epoch": 1.71, + "learning_rate": 2.5041098871449204e-06, + "loss": 0.7738, + "step": 6050 + }, + { + "epoch": 1.72, + "learning_rate": 2.4558311597704636e-06, + "loss": 0.778, + "step": 6060 + }, + { + "epoch": 1.72, + "learning_rate": 2.40799832665094e-06, + "loss": 0.772, + "step": 6070 + }, + { + "epoch": 1.72, + "learning_rate": 2.360612333857401e-06, + "loss": 0.7742, + "step": 6080 + }, + { + "epoch": 1.72, + "learning_rate": 2.31367411862298e-06, + "loss": 0.7846, + "step": 6090 + }, + { + "epoch": 1.73, + "learning_rate": 2.2671846093243493e-06, + "loss": 0.785, + "step": 6100 + }, + { + "epoch": 1.73, + "learning_rate": 2.221144725463359e-06, + "loss": 0.7846, + "step": 6110 + }, + { + "epoch": 1.73, + "learning_rate": 2.1755553776488745e-06, + "loss": 0.797, + "step": 6120 + }, + { + "epoch": 1.74, + "learning_rate": 2.130417467578724e-06, + "loss": 0.7936, + "step": 6130 + }, + { + "epoch": 1.74, + "learning_rate": 2.0857318880218995e-06, + "loss": 0.7785, + "step": 6140 + }, + { + "epoch": 1.74, + "learning_rate": 2.0414995228008743e-06, + "loss": 0.7619, + "step": 6150 + }, + { + "epoch": 1.74, + "learning_rate": 1.997721246774145e-06, + "loss": 0.7624, + "step": 6160 + }, + { + "epoch": 1.75, + "learning_rate": 1.9543979258189126e-06, + "loss": 0.7682, + "step": 6170 + }, + { + "epoch": 1.75, + "learning_rate": 1.911530416813953e-06, + "loss": 0.7834, + "step": 6180 + }, + { + "epoch": 1.75, + "learning_rate": 1.869119567622679e-06, + "loss": 0.7947, + "step": 6190 + }, + { + "epoch": 1.76, + "learning_rate": 1.8271662170763787e-06, + "loss": 0.8014, + "step": 6200 + }, + { + "epoch": 1.76, + "learning_rate": 1.7856711949575972e-06, + "loss": 0.7769, + "step": 6210 + }, + { + "epoch": 1.76, + "learning_rate": 1.7446353219837592e-06, + "loss": 0.7804, + "step": 6220 + }, + { + "epoch": 1.76, + "learning_rate": 1.704059409790898e-06, + "loss": 0.787, + "step": 6230 + }, + { + "epoch": 1.77, + "learning_rate": 1.6639442609176409e-06, + "loss": 0.7745, + "step": 6240 + }, + { + "epoch": 1.77, + "learning_rate": 1.6242906687893077e-06, + "loss": 0.7888, + "step": 6250 + }, + { + "epoch": 1.77, + "learning_rate": 1.5850994177022265e-06, + "loss": 0.7949, + "step": 6260 + }, + { + "epoch": 1.78, + "learning_rate": 1.546371282808226e-06, + "loss": 0.7702, + "step": 6270 + }, + { + "epoch": 1.78, + "learning_rate": 1.508107030099304e-06, + "loss": 0.7911, + "step": 6280 + }, + { + "epoch": 1.78, + "learning_rate": 1.4703074163924718e-06, + "loss": 0.7807, + "step": 6290 + }, + { + "epoch": 1.78, + "learning_rate": 1.4329731893147792e-06, + "loss": 0.7797, + "step": 6300 + }, + { + "epoch": 1.79, + "learning_rate": 1.396105087288549e-06, + "loss": 0.7899, + "step": 6310 + }, + { + "epoch": 1.79, + "learning_rate": 1.3597038395167516e-06, + "loss": 0.7755, + "step": 6320 + }, + { + "epoch": 1.79, + "learning_rate": 1.3237701659685854e-06, + "loss": 0.7765, + "step": 6330 + }, + { + "epoch": 1.8, + "learning_rate": 1.28830477736524e-06, + "loss": 0.7679, + "step": 6340 + }, + { + "epoch": 1.8, + "learning_rate": 1.253308375165857e-06, + "loss": 0.7881, + "step": 6350 + }, + { + "epoch": 1.8, + "learning_rate": 1.2187816515536105e-06, + "loss": 0.78, + "step": 6360 + }, + { + "epoch": 1.8, + "learning_rate": 1.184725289422073e-06, + "loss": 0.7893, + "step": 6370 + }, + { + "epoch": 1.81, + "learning_rate": 1.151139962361658e-06, + "loss": 0.7799, + "step": 6380 + }, + { + "epoch": 1.81, + "learning_rate": 1.1180263346463327e-06, + "loss": 0.7734, + "step": 6390 + }, + { + "epoch": 1.81, + "learning_rate": 1.0853850612204646e-06, + "loss": 0.7719, + "step": 6400 + }, + { + "epoch": 1.81, + "learning_rate": 1.053216787685865e-06, + "loss": 0.7752, + "step": 6410 + }, + { + "epoch": 1.82, + "learning_rate": 1.0215221502890254e-06, + "loss": 0.7758, + "step": 6420 + }, + { + "epoch": 1.82, + "learning_rate": 9.903017759085365e-07, + "loss": 0.7696, + "step": 6430 + }, + { + "epoch": 1.82, + "learning_rate": 9.595562820426758e-07, + "loss": 0.7828, + "step": 6440 + }, + { + "epoch": 1.83, + "learning_rate": 9.292862767972199e-07, + "loss": 0.7895, + "step": 6450 + }, + { + "epoch": 1.83, + "learning_rate": 8.994923588733856e-07, + "loss": 0.7845, + "step": 6460 + }, + { + "epoch": 1.83, + "learning_rate": 8.701751175560102e-07, + "loss": 0.771, + "step": 6470 + }, + { + "epoch": 1.83, + "learning_rate": 8.41335132701887e-07, + "loss": 0.7677, + "step": 6480 + }, + { + "epoch": 1.84, + "learning_rate": 8.129729747283016e-07, + "loss": 0.786, + "step": 6490 + }, + { + "epoch": 1.84, + "learning_rate": 7.85089204601741e-07, + "loss": 0.7883, + "step": 6500 + }, + { + "epoch": 1.84, + "learning_rate": 7.576843738268113e-07, + "loss": 0.7845, + "step": 6510 + }, + { + "epoch": 1.85, + "learning_rate": 7.307590244353263e-07, + "loss": 0.7837, + "step": 6520 + }, + { + "epoch": 1.85, + "learning_rate": 7.043136889755691e-07, + "loss": 0.7697, + "step": 6530 + }, + { + "epoch": 1.85, + "learning_rate": 6.783488905017871e-07, + "loss": 0.782, + "step": 6540 + }, + { + "epoch": 1.85, + "learning_rate": 6.528651425638272e-07, + "loss": 0.7923, + "step": 6550 + }, + { + "epoch": 1.86, + "learning_rate": 6.278629491969862e-07, + "loss": 0.7745, + "step": 6560 + }, + { + "epoch": 1.86, + "learning_rate": 6.033428049120326e-07, + "loss": 0.7882, + "step": 6570 + }, + { + "epoch": 1.86, + "learning_rate": 5.793051946854422e-07, + "loss": 0.7655, + "step": 6580 + }, + { + "epoch": 1.87, + "learning_rate": 5.557505939497915e-07, + "loss": 0.7864, + "step": 6590 + }, + { + "epoch": 1.87, + "learning_rate": 5.326794685843655e-07, + "loss": 0.7793, + "step": 6600 + }, + { + "epoch": 1.87, + "learning_rate": 5.100922749059239e-07, + "loss": 0.787, + "step": 6610 + }, + { + "epoch": 1.87, + "learning_rate": 4.879894596597018e-07, + "loss": 0.7651, + "step": 6620 + }, + { + "epoch": 1.88, + "learning_rate": 4.663714600105534e-07, + "loss": 0.7677, + "step": 6630 + }, + { + "epoch": 1.88, + "learning_rate": 4.452387035343203e-07, + "loss": 0.7847, + "step": 6640 + }, + { + "epoch": 1.88, + "learning_rate": 4.2459160820935153e-07, + "loss": 0.7849, + "step": 6650 + }, + { + "epoch": 1.89, + "learning_rate": 4.044305824082717e-07, + "loss": 0.7688, + "step": 6660 + }, + { + "epoch": 1.89, + "learning_rate": 3.84756024889868e-07, + "loss": 0.7796, + "step": 6670 + }, + { + "epoch": 1.89, + "learning_rate": 3.6556832479123504e-07, + "loss": 0.762, + "step": 6680 + }, + { + "epoch": 1.89, + "learning_rate": 3.468678616200427e-07, + "loss": 0.7947, + "step": 6690 + }, + { + "epoch": 1.9, + "learning_rate": 3.2865500524707217e-07, + "loss": 0.778, + "step": 6700 + }, + { + "epoch": 1.9, + "learning_rate": 3.109301158988609e-07, + "loss": 0.7822, + "step": 6710 + }, + { + "epoch": 1.9, + "learning_rate": 2.936935441506028e-07, + "loss": 0.7796, + "step": 6720 + }, + { + "epoch": 1.91, + "learning_rate": 2.769456309192037e-07, + "loss": 0.7749, + "step": 6730 + }, + { + "epoch": 1.91, + "learning_rate": 2.6068670745654224e-07, + "loss": 0.7731, + "step": 6740 + }, + { + "epoch": 1.91, + "learning_rate": 2.449170953429225e-07, + "loss": 0.7696, + "step": 6750 + }, + { + "epoch": 1.91, + "learning_rate": 2.296371064806957e-07, + "loss": 0.7868, + "step": 6760 + }, + { + "epoch": 1.92, + "learning_rate": 2.1484704308812053e-07, + "loss": 0.7805, + "step": 6770 + }, + { + "epoch": 1.92, + "learning_rate": 2.0054719769335428e-07, + "loss": 0.7802, + "step": 6780 + }, + { + "epoch": 1.92, + "learning_rate": 1.8673785312869063e-07, + "loss": 0.7787, + "step": 6790 + }, + { + "epoch": 1.93, + "learning_rate": 1.7341928252495033e-07, + "loss": 0.7886, + "step": 6800 + }, + { + "epoch": 1.93, + "learning_rate": 1.60591749306091e-07, + "loss": 0.7902, + "step": 6810 + }, + { + "epoch": 1.93, + "learning_rate": 1.4825550718398362e-07, + "loss": 0.7577, + "step": 6820 + }, + { + "epoch": 1.93, + "learning_rate": 1.3641080015341369e-07, + "loss": 0.7703, + "step": 6830 + }, + { + "epoch": 1.94, + "learning_rate": 1.2505786248723229e-07, + "loss": 0.7588, + "step": 6840 + }, + { + "epoch": 1.94, + "learning_rate": 1.1419691873174043e-07, + "loss": 0.7651, + "step": 6850 + }, + { + "epoch": 1.94, + "learning_rate": 1.038281837022398e-07, + "loss": 0.7739, + "step": 6860 + }, + { + "epoch": 1.95, + "learning_rate": 9.395186247878329e-08, + "loss": 0.7628, + "step": 6870 + }, + { + "epoch": 1.95, + "learning_rate": 8.456815040212562e-08, + "loss": 0.7739, + "step": 6880 + }, + { + "epoch": 1.95, + "learning_rate": 7.567723306984853e-08, + "loss": 0.7889, + "step": 6890 + }, + { + "epoch": 1.95, + "learning_rate": 6.727928633270264e-08, + "loss": 0.7842, + "step": 6900 + }, + { + "epoch": 1.96, + "learning_rate": 5.937447629112414e-08, + "loss": 0.7673, + "step": 6910 + }, + { + "epoch": 1.96, + "learning_rate": 5.196295929193739e-08, + "loss": 0.7881, + "step": 6920 + }, + { + "epoch": 1.96, + "learning_rate": 4.5044881925287994e-08, + "loss": 0.7665, + "step": 6930 + }, + { + "epoch": 1.96, + "learning_rate": 3.862038102172283e-08, + "loss": 0.7724, + "step": 6940 + }, + { + "epoch": 1.97, + "learning_rate": 3.268958364948671e-08, + "loss": 0.7703, + "step": 6950 + }, + { + "epoch": 1.97, + "learning_rate": 2.7252607112018823e-08, + "loss": 0.7615, + "step": 6960 + }, + { + "epoch": 1.97, + "learning_rate": 2.2309558945621257e-08, + "loss": 0.7853, + "step": 6970 + }, + { + "epoch": 1.98, + "learning_rate": 1.7860536917341243e-08, + "loss": 0.764, + "step": 6980 + }, + { + "epoch": 1.98, + "learning_rate": 1.3905629023031052e-08, + "loss": 0.773, + "step": 6990 + }, + { + "epoch": 1.98, + "learning_rate": 1.0444913485610498e-08, + "loss": 0.7812, + "step": 7000 + }, + { + "epoch": 1.98, + "learning_rate": 7.478458753518159e-09, + "loss": 0.7781, + "step": 7010 + }, + { + "epoch": 1.99, + "learning_rate": 5.006323499359699e-09, + "loss": 0.7871, + "step": 7020 + }, + { + "epoch": 1.99, + "learning_rate": 3.02855661874768e-09, + "loss": 0.7657, + "step": 7030 + }, + { + "epoch": 1.99, + "learning_rate": 1.5451972293301087e-09, + "loss": 0.7674, + "step": 7040 + }, + { + "epoch": 2.0, + "learning_rate": 5.56274670021617e-10, + "loss": 0.7881, + "step": 7050 + }, + { + "epoch": 2.0, + "learning_rate": 6.180850041781483e-11, + "loss": 0.8101, + "step": 7060 + }, + { + "epoch": 2.0, + "step": 7064, + "total_flos": 2.502171672110642e+19, + "train_loss": 0.819440008492324, + "train_runtime": 68529.0816, + "train_samples_per_second": 6.597, + "train_steps_per_second": 0.103 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 2.502171672110642e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-lora/training_args.bin b/sft-lora/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eed0ff4867b1994122fd7acbeae2361d0d3b65f --- /dev/null +++ b/sft-lora/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9990bd8d9bf61dcf0d79a1a831b0934c6cc3a114d136458fc4cdd6dc2a9387 +size 3272 diff --git a/sft-lora/training_loss.png b/sft-lora/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..71a9467c7cc876fd04b3f8ce2e9029948b99eeac Binary files /dev/null and b/sft-lora/training_loss.png differ diff --git a/sft-qlora/README.md b/sft-qlora/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/adapter_config.json b/sft-qlora/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/adapter_model.bin b/sft-qlora/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..35c05f8f601d09128971397fd76df6aa27a27587 --- /dev/null +++ b/sft-qlora/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f19937f4db7566260b91168505f6cd4ef8d5e60e154668650d7e8b5d7b18b8fd +size 26269517 diff --git a/sft-qlora/all_results.json b/sft-qlora/all_results.json new file mode 100644 index 0000000000000000000000000000000000000000..fbc8abca687789f58146a86e9665e52ea5ca99cc --- /dev/null +++ b/sft-qlora/all_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 2.0, + "train_loss": 0.8239178928553991, + "train_runtime": 71865.5404, + "train_samples_per_second": 6.291, + "train_steps_per_second": 0.098 +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-1000/README.md b/sft-qlora/checkpoint-1000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/checkpoint-1000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/checkpoint-1000/adapter_config.json b/sft-qlora/checkpoint-1000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/checkpoint-1000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-1000/adapter_model.bin b/sft-qlora/checkpoint-1000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c60d2f67bf2bdfe6caea75a09a2b217b1f0235a --- /dev/null +++ b/sft-qlora/checkpoint-1000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ade45b8ab268e80187b64e00af11a380aa6d233a836db8b0701b04018552b6b +size 26269517 diff --git a/sft-qlora/checkpoint-1000/finetuning_args.json b/sft-qlora/checkpoint-1000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/checkpoint-1000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/checkpoint-1000/optimizer.pt b/sft-qlora/checkpoint-1000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..923ee97a1ba279753739a67306b35709911e5956 --- /dev/null +++ b/sft-qlora/checkpoint-1000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed03eb792c08fc5347160de68b6408aa5b1aa89756d344fdcad1965ac02c1ccb +size 52562821 diff --git a/sft-qlora/checkpoint-1000/rng_state_0.pth b/sft-qlora/checkpoint-1000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e53764928430fe7114703f2645e078a66de956ac --- /dev/null +++ b/sft-qlora/checkpoint-1000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1861187ed29864a34a274819277748606c140a8a54f9855b4010d1a3b1262252 +size 18679 diff --git a/sft-qlora/checkpoint-1000/rng_state_1.pth b/sft-qlora/checkpoint-1000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0668465d157684b4930a2b5cbc0e928dc663b72 --- /dev/null +++ b/sft-qlora/checkpoint-1000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1a43a503c0c1cef10b6406a484cd1cc4786ea475b7a565189f777cc2921d11 +size 18679 diff --git a/sft-qlora/checkpoint-1000/rng_state_2.pth b/sft-qlora/checkpoint-1000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..94781b4230eb7319a97e2dc109ee14a5f452dcdd --- /dev/null +++ b/sft-qlora/checkpoint-1000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8a5d9504efb5c0f487d4382ef1567e19039e679b4b3786908d3af7dd41db84 +size 18679 diff --git a/sft-qlora/checkpoint-1000/rng_state_3.pth b/sft-qlora/checkpoint-1000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8fef772262726c9870b9bdc274f09e6a03ec212d --- /dev/null +++ b/sft-qlora/checkpoint-1000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05670d089596e2c7f3408383b58b668b05e193e7533b3391b742d6e5b3f5aa2d +size 18679 diff --git a/sft-qlora/checkpoint-1000/scheduler.pt b/sft-qlora/checkpoint-1000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..79aae0d92ca00e8feef41d32ee19e5bdc9d491c8 --- /dev/null +++ b/sft-qlora/checkpoint-1000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a591e3a265f45cc7ea1e1f12ab952409ddc4d51476e1e6e5b82f1289d6c35f2e +size 627 diff --git a/sft-qlora/checkpoint-1000/trainer_state.json b/sft-qlora/checkpoint-1000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..77535c8241a053f3449b24767f36c3ce793d84c0 --- /dev/null +++ b/sft-qlora/checkpoint-1000/trainer_state.json @@ -0,0 +1,616 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.28312570781426954, + "global_step": 1000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 1.7931999261260513e+18, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/checkpoint-1000/training_args.bin b/sft-qlora/checkpoint-1000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/checkpoint-1000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/checkpoint-2000/README.md b/sft-qlora/checkpoint-2000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/checkpoint-2000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/checkpoint-2000/adapter_config.json b/sft-qlora/checkpoint-2000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/checkpoint-2000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-2000/adapter_model.bin b/sft-qlora/checkpoint-2000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..d60a4f2df4164ba7c353e60f7333a9b5c7d6daef --- /dev/null +++ b/sft-qlora/checkpoint-2000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3405401245441ae54470d66a897e9c7a3346603c84a3433ed319bac97d189b9d +size 26269517 diff --git a/sft-qlora/checkpoint-2000/finetuning_args.json b/sft-qlora/checkpoint-2000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/checkpoint-2000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/checkpoint-2000/optimizer.pt b/sft-qlora/checkpoint-2000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..33529dbb87e92755069ebecc728729e615450915 --- /dev/null +++ b/sft-qlora/checkpoint-2000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a54ab2d2457a98ff5826f0bee892166ecb756200b518bc4debe7d2fe0edf339 +size 52562821 diff --git a/sft-qlora/checkpoint-2000/rng_state_0.pth b/sft-qlora/checkpoint-2000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..49df96d969c916b860405c00c88024ca09bcf369 --- /dev/null +++ b/sft-qlora/checkpoint-2000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7465f2ce05639a998be3048ae8b2b3ddc511bd8df0ac0af63a4781d83ba13d1 +size 18679 diff --git a/sft-qlora/checkpoint-2000/rng_state_1.pth b/sft-qlora/checkpoint-2000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..cefe4e53c0b772e71fcb83f33003393cea0b087e --- /dev/null +++ b/sft-qlora/checkpoint-2000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ee3a01821de7105bb38914d05f567f5ca9005a475248f6ff57a994dda760946 +size 18679 diff --git a/sft-qlora/checkpoint-2000/rng_state_2.pth b/sft-qlora/checkpoint-2000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0216babc382454d6b6ee1c14da388ffb76d01769 --- /dev/null +++ b/sft-qlora/checkpoint-2000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f7328df9304c13f5f3ac9062a268875c9d2eb34607511e75df0f729cd3e462 +size 18679 diff --git a/sft-qlora/checkpoint-2000/rng_state_3.pth b/sft-qlora/checkpoint-2000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa2991275b5aeab5d5bbff85b8589eb48d78b93b --- /dev/null +++ b/sft-qlora/checkpoint-2000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:363a7b98f242c61426c18c7085f5f8d7a1a938e734adb4c74cdcb7e8c3a8f683 +size 18679 diff --git a/sft-qlora/checkpoint-2000/scheduler.pt b/sft-qlora/checkpoint-2000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f579a1bc205ecfd68870c1065bf18043c82ec1 --- /dev/null +++ b/sft-qlora/checkpoint-2000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e63b0f7d224d36a047a120fdc989122c10ff555fd9e9271cc2a05e908022f9 +size 627 diff --git a/sft-qlora/checkpoint-2000/trainer_state.json b/sft-qlora/checkpoint-2000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..cc7d73ef4057ed5edd4357ae517caf156d3c35fd --- /dev/null +++ b/sft-qlora/checkpoint-2000/trainer_state.json @@ -0,0 +1,1216 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.5662514156285391, + "global_step": 2000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8583, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.874, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8554, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8807, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8633, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.875, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8709, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8634, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.8566, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8667, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8688, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8573, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8576, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8525, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8656, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8703, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8616, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8677, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8525, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8526, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8586, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8542, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8517, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8592, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8678, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8644, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8541, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8438, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8604, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8633, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.8437, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8466, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8457, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.8477, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8608, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8555, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8624, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8613, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.849, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.858, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8468, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8624, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.8464, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8575, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8587, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8517, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8427, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8588, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8516, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8408, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8513, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8554, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8598, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8495, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8338, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8576, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.8593, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.8534, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8564, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8446, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8445, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8281, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8449, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8405, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8349, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8311, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8383, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8313, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8424, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8323, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8501, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8399, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.8184, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.8418, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.828, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.836, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.825, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8357, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8498, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8361, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8237, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8413, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.823, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8501, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.8372, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8072, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8409, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.856, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8428, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8344, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8317, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.8172, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8305, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8303, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8292, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8162, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8344, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.8545, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8305, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8365, + "step": 2000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 3.5864645752617697e+18, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/checkpoint-2000/training_args.bin b/sft-qlora/checkpoint-2000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/checkpoint-2000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/checkpoint-3000/README.md b/sft-qlora/checkpoint-3000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/checkpoint-3000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/checkpoint-3000/adapter_config.json b/sft-qlora/checkpoint-3000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/checkpoint-3000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-3000/adapter_model.bin b/sft-qlora/checkpoint-3000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..db4f38040720a555b115de0f402beac75468791c --- /dev/null +++ b/sft-qlora/checkpoint-3000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29eae167f186afa909bdbb24d8a9244bcc1d8c36b131bc433ed765998804383f +size 26269517 diff --git a/sft-qlora/checkpoint-3000/finetuning_args.json b/sft-qlora/checkpoint-3000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/checkpoint-3000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/checkpoint-3000/optimizer.pt b/sft-qlora/checkpoint-3000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..a62abb234e3724e8072d89cdd7034762f5bf20fc --- /dev/null +++ b/sft-qlora/checkpoint-3000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:123ff8d0cbfe1d64e63af3bb570b45a07a45c9c82b763c749ccf40da87ffd025 +size 52562821 diff --git a/sft-qlora/checkpoint-3000/rng_state_0.pth b/sft-qlora/checkpoint-3000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8452d3faaa8a76655031eba09ec2681ecaf0716 --- /dev/null +++ b/sft-qlora/checkpoint-3000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a7eb5b8e8df77a28bae52aab0825bbf464c442823a918c8ab23ef65981e021 +size 18679 diff --git a/sft-qlora/checkpoint-3000/rng_state_1.pth b/sft-qlora/checkpoint-3000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fb8d272d882b95fd4ce5c9569c3cd938d58e91b --- /dev/null +++ b/sft-qlora/checkpoint-3000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1631a5d40918fbf5f8ae222feb84849c1ede3edd65f16ee958ba249cf9aa97c +size 18679 diff --git a/sft-qlora/checkpoint-3000/rng_state_2.pth b/sft-qlora/checkpoint-3000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..712a4258915fa36496ee996800a62762f6fe4091 --- /dev/null +++ b/sft-qlora/checkpoint-3000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7eeef1946d7c0d7991d091de6cd19ddde849be1517808f4a188ce2b388d40d +size 18679 diff --git a/sft-qlora/checkpoint-3000/rng_state_3.pth b/sft-qlora/checkpoint-3000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..523092e5605a432b13312e5ea1a01056523855ff --- /dev/null +++ b/sft-qlora/checkpoint-3000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7daeb6aa713d94eb58a4d49781817819edcb074368e56ca383283dd59f60ce0b +size 18679 diff --git a/sft-qlora/checkpoint-3000/scheduler.pt b/sft-qlora/checkpoint-3000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..23c3cbe8a05547e4b38f4612b48acd2e829c9ecf --- /dev/null +++ b/sft-qlora/checkpoint-3000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b3f6531267b4bdbf5a6a0db75b0e9169e561b588905320233f1373d13e9940 +size 627 diff --git a/sft-qlora/checkpoint-3000/trainer_state.json b/sft-qlora/checkpoint-3000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..bbbf715177e01d07d56d953b52be025fc3f6f223 --- /dev/null +++ b/sft-qlora/checkpoint-3000/trainer_state.json @@ -0,0 +1,1816 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.8493771234428086, + "global_step": 3000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8583, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.874, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8554, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8807, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8633, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.875, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8709, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8634, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.8566, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8667, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8688, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8573, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8576, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8525, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8656, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8703, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8616, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8677, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8525, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8526, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8586, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8542, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8517, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8592, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8678, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8644, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8541, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8438, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8604, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8633, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.8437, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8466, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8457, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.8477, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8608, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8555, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8624, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8613, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.849, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.858, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8468, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8624, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.8464, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8575, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8587, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8517, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8427, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8588, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8516, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8408, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8513, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8554, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8598, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8495, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8338, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8576, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.8593, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.8534, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8564, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8446, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8445, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8281, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8449, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8405, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8349, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8311, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8383, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8313, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8424, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8323, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8501, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8399, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.8184, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.8418, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.828, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.836, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.825, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8357, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8498, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8361, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8237, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8413, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.823, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8501, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.8372, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8072, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8409, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.856, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8428, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8344, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8317, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.8172, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8305, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8303, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8292, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8162, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8344, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.8545, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8305, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8365, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8375, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8351, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8165, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8194, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8218, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8203, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.832, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8066, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8421, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8217, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8268, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8321, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8266, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.82, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8347, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8472, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8092, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8166, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.817, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8073, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8355, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8232, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8312, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8215, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8263, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8282, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8337, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8291, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8444, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8063, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.825, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8244, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8086, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.823, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8177, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8142, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8236, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8169, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.8143, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8061, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8253, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.812, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.8263, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8144, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8089, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8155, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8142, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8192, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8134, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8175, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8192, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8348, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8147, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8235, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8175, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8197, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.808, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8154, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8104, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8318, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8146, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8097, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8176, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8284, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.8159, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8204, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.8013, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8196, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.802, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8204, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8055, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8171, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8222, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8104, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8147, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.8017, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8059, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.8204, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.812, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8087, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8038, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8094, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8182, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.812, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.809, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8288, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.808, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8127, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8159, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.819, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8108, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8199, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7977, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8171, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8064, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8087, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.8023, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7978, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8268, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8129, + "step": 3000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 5.381823572857586e+18, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/checkpoint-3000/training_args.bin b/sft-qlora/checkpoint-3000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/checkpoint-3000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/checkpoint-4000/README.md b/sft-qlora/checkpoint-4000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/checkpoint-4000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/checkpoint-4000/adapter_config.json b/sft-qlora/checkpoint-4000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/checkpoint-4000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-4000/adapter_model.bin b/sft-qlora/checkpoint-4000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed1dfb134b3b8916c5e86bdcbc45aeeffd8f720a --- /dev/null +++ b/sft-qlora/checkpoint-4000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c284bc513ebad80b72570c4ac6b38a8a6e4c16b2fe56a1869db3c7fcddfca7 +size 26269517 diff --git a/sft-qlora/checkpoint-4000/finetuning_args.json b/sft-qlora/checkpoint-4000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/checkpoint-4000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/checkpoint-4000/optimizer.pt b/sft-qlora/checkpoint-4000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9aa2dfc4d457c95e809d1a6e0b19dc48ee7a793 --- /dev/null +++ b/sft-qlora/checkpoint-4000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a0e8a249d87882d5dc9c651cfdf334af22f56b73827937afc626636add3b111 +size 52562821 diff --git a/sft-qlora/checkpoint-4000/rng_state_0.pth b/sft-qlora/checkpoint-4000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3767665ccfb89290b870aca38b4ff390d5a94306 --- /dev/null +++ b/sft-qlora/checkpoint-4000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5978240c798217567b7409b3e3c7de5f7291e7ae6eb4c309423593affef4653b +size 18679 diff --git a/sft-qlora/checkpoint-4000/rng_state_1.pth b/sft-qlora/checkpoint-4000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..f6e40d09f3e4e39f635158cffb8df47fa3f46a40 --- /dev/null +++ b/sft-qlora/checkpoint-4000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64f4894fc31ab7c0c49ae19facf802bebc8846340239b23a7ad9f2f7a0e1d1a +size 18679 diff --git a/sft-qlora/checkpoint-4000/rng_state_2.pth b/sft-qlora/checkpoint-4000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f9e9f58f17b641ff0e3d9da55d8d48899d005921 --- /dev/null +++ b/sft-qlora/checkpoint-4000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7ded5e4425f3a43a00810873c05393ff8acafce3f3347f9b2a6673dbaa1939 +size 18679 diff --git a/sft-qlora/checkpoint-4000/rng_state_3.pth b/sft-qlora/checkpoint-4000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ebaab8b29c2507ada6c2782d4b725caa8ec483b6 --- /dev/null +++ b/sft-qlora/checkpoint-4000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb9df962e1207e2a5858e2bcf9d6f4123a9a9f636f71f15d2d6dca8f8248092 +size 18679 diff --git a/sft-qlora/checkpoint-4000/scheduler.pt b/sft-qlora/checkpoint-4000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a2d33d284e4848bd18d8934b7e240129b62bf4d --- /dev/null +++ b/sft-qlora/checkpoint-4000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf7e35bc1d9d6e77c904ac697970bf3fe9271b75c118e224f479ab9fa296d48 +size 627 diff --git a/sft-qlora/checkpoint-4000/trainer_state.json b/sft-qlora/checkpoint-4000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..c09be18edac73421131715aea368c5b60cba58dd --- /dev/null +++ b/sft-qlora/checkpoint-4000/trainer_state.json @@ -0,0 +1,2416 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.1325028312570782, + "global_step": 4000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8583, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.874, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8554, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8807, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8633, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.875, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8709, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8634, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.8566, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8667, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8688, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8573, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8576, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8525, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8656, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8703, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8616, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8677, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8525, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8526, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8586, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8542, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8517, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8592, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8678, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8644, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8541, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8438, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8604, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8633, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.8437, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8466, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8457, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.8477, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8608, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8555, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8624, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8613, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.849, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.858, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8468, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8624, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.8464, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8575, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8587, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8517, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8427, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8588, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8516, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8408, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8513, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8554, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8598, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8495, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8338, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8576, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.8593, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.8534, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8564, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8446, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8445, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8281, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8449, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8405, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8349, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8311, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8383, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8313, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8424, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8323, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8501, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8399, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.8184, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.8418, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.828, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.836, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.825, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8357, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8498, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8361, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8237, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8413, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.823, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8501, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.8372, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8072, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8409, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.856, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8428, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8344, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8317, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.8172, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8305, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8303, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8292, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8162, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8344, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.8545, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8305, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8365, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8375, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8351, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8165, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8194, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8218, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8203, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.832, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8066, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8421, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8217, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8268, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8321, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8266, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.82, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8347, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8472, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8092, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8166, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.817, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8073, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8355, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8232, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8312, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8215, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8263, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8282, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8337, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8291, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8444, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8063, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.825, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8244, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8086, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.823, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8177, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8142, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8236, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8169, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.8143, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8061, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8253, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.812, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.8263, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8144, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8089, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8155, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8142, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8192, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8134, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8175, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8192, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8348, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8147, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8235, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8175, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8197, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.808, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8154, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8104, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8318, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8146, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8097, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8176, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8284, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.8159, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8204, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.8013, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8196, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.802, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8204, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8055, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8171, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8222, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8104, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8147, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.8017, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8059, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.8204, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.812, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8087, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8038, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8094, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8182, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.812, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.809, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8288, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.808, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8127, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8159, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.819, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8108, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8199, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7977, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8171, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8064, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8087, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.8023, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7978, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8268, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8129, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8121, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.8018, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8191, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.813, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8252, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7995, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8162, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8175, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8076, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8063, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8159, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8083, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.807, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.8123, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8107, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8053, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.8068, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.8086, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8042, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.8019, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8117, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8243, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.7953, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8042, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.799, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8093, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8048, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8116, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.8151, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.8017, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8051, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.803, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8094, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8186, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8041, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.8009, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7931, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.8001, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8167, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8114, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.8026, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8063, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8087, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.812, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7899, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.798, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.826, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.8111, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7924, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.8001, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.7906, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.804, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8123, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8164, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8169, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7835, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.8199, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8096, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7792, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7789, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8127, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.816, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8045, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8065, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.8016, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7902, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8044, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8136, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7885, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7734, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8117, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7969, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.7741, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7996, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.806, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7969, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.8017, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8066, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7969, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.8008, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.8111, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7797, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.8016, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7962, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7897, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7951, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.7856, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7823, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8101, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7789, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7993, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8107, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.8005, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8144, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7894, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7763, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.781, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7878, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7956, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.8036, + "step": 4000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 7.176649374959665e+18, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/checkpoint-4000/training_args.bin b/sft-qlora/checkpoint-4000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/checkpoint-4000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/checkpoint-5000/README.md b/sft-qlora/checkpoint-5000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/checkpoint-5000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/checkpoint-5000/adapter_config.json b/sft-qlora/checkpoint-5000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/checkpoint-5000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-5000/adapter_model.bin b/sft-qlora/checkpoint-5000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..56dad0ca0aef7bff02f1b3c9e0f122b2a5601756 --- /dev/null +++ b/sft-qlora/checkpoint-5000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:151a1147f4e3125c58e5b805073ef5fefac3e82e9451dc278e58f420a8693f35 +size 26269517 diff --git a/sft-qlora/checkpoint-5000/finetuning_args.json b/sft-qlora/checkpoint-5000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/checkpoint-5000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/checkpoint-5000/optimizer.pt b/sft-qlora/checkpoint-5000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..b24a0fe93532cd1efc506949f96a569c304f7c72 --- /dev/null +++ b/sft-qlora/checkpoint-5000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55dec35c56aeedc284b504ff1e36d04b70672e21721951179330b23e4f48ec2 +size 52562821 diff --git a/sft-qlora/checkpoint-5000/rng_state_0.pth b/sft-qlora/checkpoint-5000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..5da9a617f64d389af19f5d0d0570d46b200a2d90 --- /dev/null +++ b/sft-qlora/checkpoint-5000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa749ac37126149519409e153b6a8d5b3c73f6a7f974468df2f22c8609c043bb +size 18679 diff --git a/sft-qlora/checkpoint-5000/rng_state_1.pth b/sft-qlora/checkpoint-5000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..920d8b2cf5e3bb4549e93a9710fdd148cabb282b --- /dev/null +++ b/sft-qlora/checkpoint-5000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba980348eaaec0de5f70f2b287f51dac0c18bf077ed911273607198816af372d +size 18679 diff --git a/sft-qlora/checkpoint-5000/rng_state_2.pth b/sft-qlora/checkpoint-5000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..db173929b2ebb647af075a56648289e6a8da3f41 --- /dev/null +++ b/sft-qlora/checkpoint-5000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ebbc42d20a73ad681f46a8a00221372524e938f097ed8d1826e8d19cdecbee +size 18679 diff --git a/sft-qlora/checkpoint-5000/rng_state_3.pth b/sft-qlora/checkpoint-5000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce789088719c6cfacd5ae332c4d20e73956a21c5 --- /dev/null +++ b/sft-qlora/checkpoint-5000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bba97ce2b3768f04f06dc80bc80340b192812258930e01279d032cfa9504c74 +size 18679 diff --git a/sft-qlora/checkpoint-5000/scheduler.pt b/sft-qlora/checkpoint-5000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e062e230ad61225982368924f6c1eb3e0cde18a --- /dev/null +++ b/sft-qlora/checkpoint-5000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac6449e1dc743891165d8dd07849c82d1b65a13f6e200650bec055fa9dde745 +size 627 diff --git a/sft-qlora/checkpoint-5000/trainer_state.json b/sft-qlora/checkpoint-5000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf47950fc6adb1b5e6d60447e9fbf3d3c3e381e --- /dev/null +++ b/sft-qlora/checkpoint-5000/trainer_state.json @@ -0,0 +1,3016 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.4156285390713477, + "global_step": 5000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8583, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.874, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8554, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8807, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8633, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.875, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8709, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8634, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.8566, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8667, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8688, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8573, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8576, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8525, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8656, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8703, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8616, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8677, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8525, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8526, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8586, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8542, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8517, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8592, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8678, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8644, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8541, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8438, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8604, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8633, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.8437, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8466, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8457, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.8477, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8608, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8555, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8624, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8613, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.849, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.858, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8468, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8624, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.8464, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8575, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8587, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8517, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8427, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8588, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8516, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8408, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8513, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8554, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8598, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8495, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8338, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8576, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.8593, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.8534, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8564, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8446, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8445, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8281, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8449, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8405, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8349, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8311, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8383, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8313, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8424, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8323, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8501, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8399, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.8184, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.8418, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.828, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.836, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.825, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8357, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8498, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8361, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8237, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8413, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.823, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8501, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.8372, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8072, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8409, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.856, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8428, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8344, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8317, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.8172, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8305, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8303, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8292, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8162, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8344, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.8545, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8305, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8365, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8375, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8351, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8165, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8194, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8218, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8203, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.832, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8066, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8421, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8217, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8268, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8321, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8266, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.82, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8347, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8472, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8092, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8166, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.817, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8073, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8355, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8232, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8312, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8215, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8263, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8282, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8337, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8291, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8444, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8063, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.825, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8244, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8086, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.823, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8177, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8142, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8236, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8169, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.8143, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8061, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8253, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.812, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.8263, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8144, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8089, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8155, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8142, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8192, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8134, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8175, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8192, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8348, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8147, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8235, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8175, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8197, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.808, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8154, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8104, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8318, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8146, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8097, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8176, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8284, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.8159, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8204, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.8013, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8196, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.802, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8204, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8055, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8171, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8222, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8104, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8147, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.8017, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8059, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.8204, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.812, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8087, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8038, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8094, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8182, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.812, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.809, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8288, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.808, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8127, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8159, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.819, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8108, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8199, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7977, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8171, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8064, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8087, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.8023, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7978, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8268, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8129, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8121, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.8018, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8191, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.813, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8252, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7995, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8162, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8175, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8076, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8063, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8159, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8083, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.807, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.8123, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8107, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8053, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.8068, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.8086, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8042, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.8019, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8117, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8243, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.7953, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8042, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.799, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8093, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8048, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8116, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.8151, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.8017, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8051, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.803, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8094, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8186, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8041, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.8009, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7931, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.8001, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8167, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8114, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.8026, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8063, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8087, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.812, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7899, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.798, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.826, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.8111, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7924, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.8001, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.7906, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.804, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8123, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8164, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8169, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7835, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.8199, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8096, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7792, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7789, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8127, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.816, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8045, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8065, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.8016, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7902, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8044, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8136, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7885, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7734, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8117, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7969, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.7741, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7996, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.806, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7969, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.8017, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8066, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7969, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.8008, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.8111, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7797, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.8016, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7962, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7897, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7951, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.7856, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7823, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8101, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7789, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7993, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8107, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.8005, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8144, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7894, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7763, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.781, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7878, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7956, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.8036, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7945, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7955, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7772, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7805, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.798, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8183, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8106, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7918, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.779, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7881, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7952, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7971, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.8005, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.8014, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7883, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7887, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7719, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8098, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7909, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.7791, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7946, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7973, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7961, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.797, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7961, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7918, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7868, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7843, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7968, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7917, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7872, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.777, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.8049, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7897, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.792, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7866, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8061, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.777, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7883, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7897, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.8014, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7882, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7839, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.794, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7739, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7911, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7907, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.803, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8048, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7816, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.7765, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7916, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.8015, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7826, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7834, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7873, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8033, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7973, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7736, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7968, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7773, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7971, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7808, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7826, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7767, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7962, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7876, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2686615551979702e-05, + "loss": 0.7926, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2589975741014615e-05, + "loss": 0.7939, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.2493581384142767e-05, + "loss": 0.7992, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2397434387918824e-05, + "loss": 0.7766, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.2301536654004948e-05, + "loss": 0.7887, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205890079133252e-05, + "loss": 0.7927, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2110496555068218e-05, + "loss": 0.786, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2015357968569335e-05, + "loss": 0.7821, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1920476201353763e-05, + "loss": 0.7864, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1825853130059098e-05, + "loss": 0.7888, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1731490626206263e-05, + "loss": 0.794, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.16373905561625e-05, + "loss": 0.771, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1543554781104477e-05, + "loss": 0.7984, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1449985156981413e-05, + "loss": 0.7961, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.1356683534478451e-05, + "loss": 0.7824, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1263651758979967e-05, + "loss": 0.7867, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1170891670533162e-05, + "loss": 0.787, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.107840510381158e-05, + "loss": 0.7789, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0986193888078882e-05, + "loss": 0.7951, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.0894259847152636e-05, + "loss": 0.8037, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0802604799368274e-05, + "loss": 0.7901, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0711230557543078e-05, + "loss": 0.7736, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0620138928940394e-05, + "loss": 0.7743, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0529331715233795e-05, + "loss": 0.7971, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0438810712471553e-05, + "loss": 0.7812, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.0348577711041021e-05, + "loss": 0.7788, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0258634495633277e-05, + "loss": 0.7866, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0168982845207797e-05, + "loss": 0.8023, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0079624532957316e-05, + "loss": 0.7766, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99056132627267e-06, + "loss": 0.7831, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.901794986707941e-06, + "loss": 0.7927, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.813327269945547e-06, + "loss": 0.7852, + "step": 5000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 8.974930282830365e+18, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/checkpoint-5000/training_args.bin b/sft-qlora/checkpoint-5000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/checkpoint-5000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/checkpoint-6000/README.md b/sft-qlora/checkpoint-6000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/checkpoint-6000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/checkpoint-6000/adapter_config.json b/sft-qlora/checkpoint-6000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/checkpoint-6000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-6000/adapter_model.bin b/sft-qlora/checkpoint-6000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6aad3c16626c845035ce3c04ad035c59f0d6f658 --- /dev/null +++ b/sft-qlora/checkpoint-6000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26005aa78e3df39013d3ab3e3f986789ad0d32d5ab3001791456c7d50aee4087 +size 26269517 diff --git a/sft-qlora/checkpoint-6000/finetuning_args.json b/sft-qlora/checkpoint-6000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/checkpoint-6000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/checkpoint-6000/optimizer.pt b/sft-qlora/checkpoint-6000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..429c523fa447dea9f45e37d5c5749008f86c4af9 --- /dev/null +++ b/sft-qlora/checkpoint-6000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c51abdaf77ffb142d02f798322d439bc91ad1f813c6ba960601a6ffdf3ad368 +size 52562821 diff --git a/sft-qlora/checkpoint-6000/rng_state_0.pth b/sft-qlora/checkpoint-6000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..702d1d371cc01630d5c2e0eee505cb4a2f993d10 --- /dev/null +++ b/sft-qlora/checkpoint-6000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b5afb582286dc1f513c8f1589e44203922864b0eecb5d968bb7e9bc87aa84e +size 18679 diff --git a/sft-qlora/checkpoint-6000/rng_state_1.pth b/sft-qlora/checkpoint-6000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1828ae0358bc5852c545eb14cc1f0ba8cb5877a --- /dev/null +++ b/sft-qlora/checkpoint-6000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8746d399d43005a6447ab9d40f84e0907616385574832c925bbc169145ea806 +size 18679 diff --git a/sft-qlora/checkpoint-6000/rng_state_2.pth b/sft-qlora/checkpoint-6000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a100206e289a956c92746593dbf9efe0fc9a657a --- /dev/null +++ b/sft-qlora/checkpoint-6000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d416c799ff2ec4a2d6a8e09383202ff1c136b92ab323e2325bc9a0646fc5cfea +size 18679 diff --git a/sft-qlora/checkpoint-6000/rng_state_3.pth b/sft-qlora/checkpoint-6000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b72fb4b99f89e30566ac3f1140ae5beaaf61a996 --- /dev/null +++ b/sft-qlora/checkpoint-6000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f531295e2f7b930d3678382354c0c47ba5cd0e89c32f49834a21b093eebb41f +size 18679 diff --git a/sft-qlora/checkpoint-6000/scheduler.pt b/sft-qlora/checkpoint-6000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d24341181215740ecf12d3ba7567a376283a28 --- /dev/null +++ b/sft-qlora/checkpoint-6000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8920d9fb0e6bd69a90d39c3c59dc01e42c3e96ecfd05bee7eec0c8fd5645f87 +size 627 diff --git a/sft-qlora/checkpoint-6000/trainer_state.json b/sft-qlora/checkpoint-6000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..6e9edbe7d426d5a5fa51a8b3ab9f026084105324 --- /dev/null +++ b/sft-qlora/checkpoint-6000/trainer_state.json @@ -0,0 +1,3616 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.6987542468856174, + "global_step": 6000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8583, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.874, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8554, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8807, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8633, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.875, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8709, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8634, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.8566, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8667, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8688, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8573, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8576, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8525, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8656, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8703, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8616, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8677, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8525, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8526, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8586, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8542, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8517, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8592, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8678, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8644, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8541, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8438, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8604, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8633, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.8437, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8466, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8457, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.8477, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8608, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8555, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8624, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8613, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.849, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.858, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8468, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8624, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.8464, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8575, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8587, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8517, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8427, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8588, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8516, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8408, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8513, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8554, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8598, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8495, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8338, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8576, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.8593, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.8534, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8564, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8446, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8445, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8281, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8449, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8405, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8349, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8311, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8383, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8313, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8424, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8323, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8501, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8399, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.8184, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.8418, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.828, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.836, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.825, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8357, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8498, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8361, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8237, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8413, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.823, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8501, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.8372, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8072, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8409, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.856, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8428, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8344, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8317, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.8172, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8305, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8303, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8292, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8162, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8344, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.8545, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8305, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8365, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8375, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8351, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8165, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8194, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8218, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8203, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.832, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8066, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8421, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8217, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8268, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8321, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8266, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.82, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8347, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8472, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8092, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8166, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.817, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8073, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8355, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8232, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8312, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8215, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8263, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8282, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8337, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8291, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8444, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8063, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.825, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8244, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8086, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.823, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8177, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8142, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8236, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8169, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.8143, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8061, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8253, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.812, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.8263, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8144, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8089, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8155, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8142, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8192, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8134, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8175, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8192, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8348, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8147, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8235, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8175, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8197, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.808, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8154, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8104, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8318, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8146, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8097, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8176, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8284, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.8159, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8204, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.8013, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8196, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.802, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8204, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8055, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8171, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8222, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8104, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8147, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.8017, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8059, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.8204, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.812, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8087, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8038, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8094, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8182, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.812, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.809, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8288, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.808, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8127, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8159, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.819, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8108, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8199, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7977, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8171, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8064, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8087, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.8023, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7978, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8268, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8129, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8121, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.8018, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8191, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.813, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8252, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7995, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8162, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8175, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8076, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8063, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8159, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8083, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.807, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.8123, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8107, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8053, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.8068, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.8086, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8042, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.8019, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8117, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8243, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.7953, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8042, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.799, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8093, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8048, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8116, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.8151, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.8017, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8051, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.803, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8094, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8186, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8041, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.8009, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7931, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.8001, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8167, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8114, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.8026, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8063, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8087, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.812, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7899, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.798, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.826, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.8111, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7924, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.8001, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.7906, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.804, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8123, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8164, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8169, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7835, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.8199, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8096, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7792, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7789, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8127, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.816, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8045, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8065, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.8016, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7902, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8044, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8136, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7885, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7734, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8117, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7969, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.7741, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7996, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.806, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7969, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.8017, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8066, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7969, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.8008, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.8111, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7797, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.8016, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7962, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7897, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7951, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.7856, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7823, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8101, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7789, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7993, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8107, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.8005, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8144, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7894, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7763, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.781, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7878, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7956, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.8036, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7945, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7955, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7772, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7805, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.798, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8183, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8106, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7918, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.779, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7881, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7952, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7971, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.8005, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.8014, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7883, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7887, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7719, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8098, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7909, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.7791, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7946, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7973, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7961, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.797, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7961, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7918, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7868, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7843, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7968, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7917, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7872, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.777, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.8049, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7897, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.792, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7866, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8061, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.777, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7883, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7897, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.8014, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7882, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7839, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.794, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7739, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7911, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7907, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.803, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8048, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7816, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.7765, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7916, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.8015, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7826, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7834, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7873, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8033, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7973, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7736, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7968, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7773, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7971, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7808, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7826, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7767, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7962, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7876, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2686615551979702e-05, + "loss": 0.7926, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2589975741014615e-05, + "loss": 0.7939, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.2493581384142767e-05, + "loss": 0.7992, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2397434387918824e-05, + "loss": 0.7766, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.2301536654004948e-05, + "loss": 0.7887, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205890079133252e-05, + "loss": 0.7927, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2110496555068218e-05, + "loss": 0.786, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2015357968569335e-05, + "loss": 0.7821, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1920476201353763e-05, + "loss": 0.7864, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1825853130059098e-05, + "loss": 0.7888, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1731490626206263e-05, + "loss": 0.794, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.16373905561625e-05, + "loss": 0.771, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1543554781104477e-05, + "loss": 0.7984, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1449985156981413e-05, + "loss": 0.7961, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.1356683534478451e-05, + "loss": 0.7824, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1263651758979967e-05, + "loss": 0.7867, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1170891670533162e-05, + "loss": 0.787, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.107840510381158e-05, + "loss": 0.7789, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0986193888078882e-05, + "loss": 0.7951, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.0894259847152636e-05, + "loss": 0.8037, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0802604799368274e-05, + "loss": 0.7901, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0711230557543078e-05, + "loss": 0.7736, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0620138928940394e-05, + "loss": 0.7743, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0529331715233795e-05, + "loss": 0.7971, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0438810712471553e-05, + "loss": 0.7812, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.0348577711041021e-05, + "loss": 0.7788, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0258634495633277e-05, + "loss": 0.7866, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0168982845207797e-05, + "loss": 0.8023, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0079624532957316e-05, + "loss": 0.7766, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99056132627267e-06, + "loss": 0.7831, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.901794986707941e-06, + "loss": 0.7927, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.813327269945547e-06, + "loss": 0.7852, + "step": 5000 + }, + { + "epoch": 1.42, + "learning_rate": 9.725159925761532e-06, + "loss": 0.7649, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 9.637294697990961e-06, + "loss": 0.7818, + "step": 5020 + }, + { + "epoch": 1.42, + "learning_rate": 9.549733324493431e-06, + "loss": 0.7789, + "step": 5030 + }, + { + "epoch": 1.43, + "learning_rate": 9.462477537118717e-06, + "loss": 0.7636, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 9.375529061672467e-06, + "loss": 0.7832, + "step": 5050 + }, + { + "epoch": 1.43, + "learning_rate": 9.288889617882136e-06, + "loss": 0.7959, + "step": 5060 + }, + { + "epoch": 1.44, + "learning_rate": 9.202560919362896e-06, + "loss": 0.7896, + "step": 5070 + }, + { + "epoch": 1.44, + "learning_rate": 9.116544673583824e-06, + "loss": 0.781, + "step": 5080 + }, + { + "epoch": 1.44, + "learning_rate": 9.030842581834062e-06, + "loss": 0.7876, + "step": 5090 + }, + { + "epoch": 1.44, + "learning_rate": 8.945456339189198e-06, + "loss": 0.7818, + "step": 5100 + }, + { + "epoch": 1.45, + "learning_rate": 8.860387634477736e-06, + "loss": 0.7851, + "step": 5110 + }, + { + "epoch": 1.45, + "learning_rate": 8.775638150247714e-06, + "loss": 0.7824, + "step": 5120 + }, + { + "epoch": 1.45, + "learning_rate": 8.691209562733371e-06, + "loss": 0.7988, + "step": 5130 + }, + { + "epoch": 1.46, + "learning_rate": 8.607103541822068e-06, + "loss": 0.7771, + "step": 5140 + }, + { + "epoch": 1.46, + "learning_rate": 8.523321751021176e-06, + "loss": 0.7888, + "step": 5150 + }, + { + "epoch": 1.46, + "learning_rate": 8.43986584742526e-06, + "loss": 0.794, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 8.35673748168323e-06, + "loss": 0.7854, + "step": 5170 + }, + { + "epoch": 1.47, + "learning_rate": 8.273938297965736e-06, + "loss": 0.7927, + "step": 5180 + }, + { + "epoch": 1.47, + "learning_rate": 8.191469933932625e-06, + "loss": 0.801, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 8.109334020700591e-06, + "loss": 0.7816, + "step": 5200 + }, + { + "epoch": 1.48, + "learning_rate": 8.027532182810845e-06, + "loss": 0.7912, + "step": 5210 + }, + { + "epoch": 1.48, + "learning_rate": 7.946066038197065e-06, + "loss": 0.7818, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 7.86493719815333e-06, + "loss": 0.7833, + "step": 5230 + }, + { + "epoch": 1.48, + "learning_rate": 7.784147267302274e-06, + "loss": 0.7919, + "step": 5240 + }, + { + "epoch": 1.49, + "learning_rate": 7.70369784356336e-06, + "loss": 0.771, + "step": 5250 + }, + { + "epoch": 1.49, + "learning_rate": 7.62359051812124e-06, + "loss": 0.7887, + "step": 5260 + }, + { + "epoch": 1.49, + "learning_rate": 7.543826875394347e-06, + "loss": 0.7744, + "step": 5270 + }, + { + "epoch": 1.49, + "learning_rate": 7.464408493003483e-06, + "loss": 0.7887, + "step": 5280 + }, + { + "epoch": 1.5, + "learning_rate": 7.385336941740678e-06, + "loss": 0.7638, + "step": 5290 + }, + { + "epoch": 1.5, + "learning_rate": 7.306613785538066e-06, + "loss": 0.7778, + "step": 5300 + }, + { + "epoch": 1.5, + "learning_rate": 7.2282405814370125e-06, + "loss": 0.7769, + "step": 5310 + }, + { + "epoch": 1.51, + "learning_rate": 7.150218879557263e-06, + "loss": 0.7916, + "step": 5320 + }, + { + "epoch": 1.51, + "learning_rate": 7.072550223066321e-06, + "loss": 0.7798, + "step": 5330 + }, + { + "epoch": 1.51, + "learning_rate": 6.9952361481488896e-06, + "loss": 0.7733, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 6.918278183976554e-06, + "loss": 0.7701, + "step": 5350 + }, + { + "epoch": 1.52, + "learning_rate": 6.841677852677447e-06, + "loss": 0.7792, + "step": 5360 + }, + { + "epoch": 1.52, + "learning_rate": 6.765436669306227e-06, + "loss": 0.7863, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 6.689556141814043e-06, + "loss": 0.7821, + "step": 5380 + }, + { + "epoch": 1.53, + "learning_rate": 6.614037771018775e-06, + "loss": 0.7896, + "step": 5390 + }, + { + "epoch": 1.53, + "learning_rate": 6.538883050575284e-06, + "loss": 0.7943, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 6.464093466945919e-06, + "loss": 0.7933, + "step": 5410 + }, + { + "epoch": 1.53, + "learning_rate": 6.389670499371089e-06, + "loss": 0.7773, + "step": 5420 + }, + { + "epoch": 1.54, + "learning_rate": 6.3156156198400315e-06, + "loss": 0.7828, + "step": 5430 + }, + { + "epoch": 1.54, + "learning_rate": 6.241930293061662e-06, + "loss": 0.7769, + "step": 5440 + }, + { + "epoch": 1.54, + "learning_rate": 6.16861597643564e-06, + "loss": 0.7726, + "step": 5450 + }, + { + "epoch": 1.55, + "learning_rate": 6.0956741200235315e-06, + "loss": 0.7956, + "step": 5460 + }, + { + "epoch": 1.55, + "learning_rate": 6.023106166520104e-06, + "loss": 0.7932, + "step": 5470 + }, + { + "epoch": 1.55, + "learning_rate": 5.950913551224838e-06, + "loss": 0.7849, + "step": 5480 + }, + { + "epoch": 1.55, + "learning_rate": 5.879097702013495e-06, + "loss": 0.7968, + "step": 5490 + }, + { + "epoch": 1.56, + "learning_rate": 5.807660039309904e-06, + "loss": 0.7827, + "step": 5500 + }, + { + "epoch": 1.56, + "learning_rate": 5.736601976057848e-06, + "loss": 0.791, + "step": 5510 + }, + { + "epoch": 1.56, + "learning_rate": 5.66592491769315e-06, + "loss": 0.7792, + "step": 5520 + }, + { + "epoch": 1.57, + "learning_rate": 5.595630262115825e-06, + "loss": 0.7808, + "step": 5530 + }, + { + "epoch": 1.57, + "learning_rate": 5.525719399662488e-06, + "loss": 0.7723, + "step": 5540 + }, + { + "epoch": 1.57, + "learning_rate": 5.456193713078797e-06, + "loss": 0.7789, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 5.387054577492165e-06, + "loss": 0.7903, + "step": 5560 + }, + { + "epoch": 1.58, + "learning_rate": 5.318303360384508e-06, + "loss": 0.7801, + "step": 5570 + }, + { + "epoch": 1.58, + "learning_rate": 5.249941421565227e-06, + "loss": 0.7733, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 5.181970113144296e-06, + "loss": 0.7891, + "step": 5590 + }, + { + "epoch": 1.59, + "learning_rate": 5.114390779505557e-06, + "loss": 0.7912, + "step": 5600 + }, + { + "epoch": 1.59, + "learning_rate": 5.047204757280072e-06, + "loss": 0.7917, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 4.980413375319737e-06, + "loss": 0.7922, + "step": 5620 + }, + { + "epoch": 1.59, + "learning_rate": 4.914017954670961e-06, + "loss": 0.79, + "step": 5630 + }, + { + "epoch": 1.6, + "learning_rate": 4.8480198085485765e-06, + "loss": 0.7844, + "step": 5640 + }, + { + "epoch": 1.6, + "learning_rate": 4.782420242309821e-06, + "loss": 0.7855, + "step": 5650 + }, + { + "epoch": 1.6, + "learning_rate": 4.717220553428559e-06, + "loss": 0.779, + "step": 5660 + }, + { + "epoch": 1.61, + "learning_rate": 4.652422031469583e-06, + "loss": 0.7864, + "step": 5670 + }, + { + "epoch": 1.61, + "learning_rate": 4.58802595806315e-06, + "loss": 0.7802, + "step": 5680 + }, + { + "epoch": 1.61, + "learning_rate": 4.524033606879602e-06, + "loss": 0.7776, + "step": 5690 + }, + { + "epoch": 1.61, + "learning_rate": 4.460446243604169e-06, + "loss": 0.778, + "step": 5700 + }, + { + "epoch": 1.62, + "learning_rate": 4.3972651259119706e-06, + "loss": 0.7834, + "step": 5710 + }, + { + "epoch": 1.62, + "learning_rate": 4.3344915034431e-06, + "loss": 0.7875, + "step": 5720 + }, + { + "epoch": 1.62, + "learning_rate": 4.272126617777933e-06, + "loss": 0.787, + "step": 5730 + }, + { + "epoch": 1.63, + "learning_rate": 4.2101717024125576e-06, + "loss": 0.7773, + "step": 5740 + }, + { + "epoch": 1.63, + "learning_rate": 4.148627982734404e-06, + "loss": 0.7853, + "step": 5750 + }, + { + "epoch": 1.63, + "learning_rate": 4.087496675997965e-06, + "loss": 0.7917, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 4.026778991300762e-06, + "loss": 0.7907, + "step": 5770 + }, + { + "epoch": 1.64, + "learning_rate": 3.966476129559391e-06, + "loss": 0.7764, + "step": 5780 + }, + { + "epoch": 1.64, + "learning_rate": 3.90658928348582e-06, + "loss": 0.7718, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.847119637563739e-06, + "loss": 0.791, + "step": 5800 + }, + { + "epoch": 1.64, + "learning_rate": 3.7880683680251855e-06, + "loss": 0.7732, + "step": 5810 + }, + { + "epoch": 1.65, + "learning_rate": 3.7294366428272386e-06, + "loss": 0.7621, + "step": 5820 + }, + { + "epoch": 1.65, + "learning_rate": 3.6712256216289624e-06, + "loss": 0.7619, + "step": 5830 + }, + { + "epoch": 1.65, + "learning_rate": 3.613436455768418e-06, + "loss": 0.782, + "step": 5840 + }, + { + "epoch": 1.66, + "learning_rate": 3.5560702882399406e-06, + "loss": 0.7853, + "step": 5850 + }, + { + "epoch": 1.66, + "learning_rate": 3.499128253671494e-06, + "loss": 0.7896, + "step": 5860 + }, + { + "epoch": 1.66, + "learning_rate": 3.4426114783022546e-06, + "loss": 0.7939, + "step": 5870 + }, + { + "epoch": 1.66, + "learning_rate": 3.3865210799603253e-06, + "loss": 0.7734, + "step": 5880 + }, + { + "epoch": 1.67, + "learning_rate": 3.3308581680406182e-06, + "loss": 0.7951, + "step": 5890 + }, + { + "epoch": 1.67, + "learning_rate": 3.275623843482939e-06, + "loss": 0.7892, + "step": 5900 + }, + { + "epoch": 1.67, + "learning_rate": 3.220819198750172e-06, + "loss": 0.7788, + "step": 5910 + }, + { + "epoch": 1.68, + "learning_rate": 3.166445317806721e-06, + "loss": 0.8137, + "step": 5920 + }, + { + "epoch": 1.68, + "learning_rate": 3.1125032760970203e-06, + "loss": 0.7665, + "step": 5930 + }, + { + "epoch": 1.68, + "learning_rate": 3.0589941405243043e-06, + "loss": 0.7812, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.0059189694294774e-06, + "loss": 0.7824, + "step": 5950 + }, + { + "epoch": 1.69, + "learning_rate": 2.953278812570201e-06, + "loss": 0.7736, + "step": 5960 + }, + { + "epoch": 1.69, + "learning_rate": 2.9010747111001103e-06, + "loss": 0.7759, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 2.849307697548251e-06, + "loss": 0.7946, + "step": 5980 + }, + { + "epoch": 1.7, + "learning_rate": 2.7979787957986225e-06, + "loss": 0.7938, + "step": 5990 + }, + { + "epoch": 1.7, + "learning_rate": 2.7470890210699596e-06, + "loss": 0.7818, + "step": 6000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 1.0767168490616914e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/checkpoint-6000/training_args.bin b/sft-qlora/checkpoint-6000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/checkpoint-6000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/checkpoint-7000/README.md b/sft-qlora/checkpoint-7000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d290c902d52b2091d490255d35c9be86df84f437 --- /dev/null +++ b/sft-qlora/checkpoint-7000/README.md @@ -0,0 +1,3 @@ +--- +library_name: peft +--- diff --git a/sft-qlora/checkpoint-7000/adapter_config.json b/sft-qlora/checkpoint-7000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef4676864a7f782259cd6700dcab8059e8973ab --- /dev/null +++ b/sft-qlora/checkpoint-7000/adapter_config.json @@ -0,0 +1,20 @@ +{ + "base_model_name_or_path": "llama-13b-hf/", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "modules_to_save": null, + "peft_type": "LORA", + "r": 8, + "revision": null, + "target_modules": [ + "q_proj", + "v_proj" + ], + "task_type": "CAUSAL_LM" +} \ No newline at end of file diff --git a/sft-qlora/checkpoint-7000/adapter_model.bin b/sft-qlora/checkpoint-7000/adapter_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fdde5e84b9d5f4a6a846d75a2ae05a991e5d2fa --- /dev/null +++ b/sft-qlora/checkpoint-7000/adapter_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d89f7cd2d9da3b78c9a18d03c59c32d563fc313b27ac9442e31d609d387de9 +size 26269517 diff --git a/sft-qlora/checkpoint-7000/finetuning_args.json b/sft-qlora/checkpoint-7000/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/checkpoint-7000/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/checkpoint-7000/optimizer.pt b/sft-qlora/checkpoint-7000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6c5e045f08edb90030d74fe892d50ab1b8794e --- /dev/null +++ b/sft-qlora/checkpoint-7000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276a0519e825e22e9789c04afd43692ae245fc3063c3bc37fb60cb1416f14e79 +size 52562821 diff --git a/sft-qlora/checkpoint-7000/rng_state_0.pth b/sft-qlora/checkpoint-7000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..14de24f9400648b183a1a87d4dba0e3f1442902c --- /dev/null +++ b/sft-qlora/checkpoint-7000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41674ee63543d3cd494c5e56b71bf7975ef6eb1a4203ce26ea6a75d229a6459 +size 18679 diff --git a/sft-qlora/checkpoint-7000/rng_state_1.pth b/sft-qlora/checkpoint-7000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c5a3d730073587b4388351a6071e2b78385e036 --- /dev/null +++ b/sft-qlora/checkpoint-7000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef29132d00d7863f67201df64e6651ada06b7a507c18d22f83d1e0c2cb066dc8 +size 18679 diff --git a/sft-qlora/checkpoint-7000/rng_state_2.pth b/sft-qlora/checkpoint-7000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..edaa68baac6eb7ac90e06e296c143671a2b426c2 --- /dev/null +++ b/sft-qlora/checkpoint-7000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5df393134b32648186b44272488442b8b7df7807c197b01a520072901355d41 +size 18679 diff --git a/sft-qlora/checkpoint-7000/rng_state_3.pth b/sft-qlora/checkpoint-7000/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..f2fa2e74ac9f940a3b48fc524c38c346377e88f3 --- /dev/null +++ b/sft-qlora/checkpoint-7000/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e30d7da079ef2454837d1b8adb93645add57666813a8c7589577abd4d21e21 +size 18679 diff --git a/sft-qlora/checkpoint-7000/scheduler.pt b/sft-qlora/checkpoint-7000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4328d4843aba209737d3fac94c038527b2553a5 --- /dev/null +++ b/sft-qlora/checkpoint-7000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c118750b74d5b8fff99b8e7a67475a28dfc9543b920285fa34d7d14c00e052f +size 627 diff --git a/sft-qlora/checkpoint-7000/trainer_state.json b/sft-qlora/checkpoint-7000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2c0f652a05335e1e1c365e953b0615bab30ea82d --- /dev/null +++ b/sft-qlora/checkpoint-7000/trainer_state.json @@ -0,0 +1,4216 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.9818799546998869, + "global_step": 7000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8583, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.874, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8554, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8807, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8633, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.875, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8709, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8634, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.8566, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8667, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8688, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8573, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8576, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8525, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8656, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8703, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8616, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8677, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8525, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8526, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8586, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8542, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8517, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8592, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8678, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8644, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8541, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8438, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8604, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8633, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.8437, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8466, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8457, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.8477, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8608, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8555, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8624, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8613, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.849, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.858, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8468, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8624, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.8464, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8575, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8587, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8517, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8427, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8588, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8516, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8408, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8513, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8554, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8598, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8495, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8338, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8576, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.8593, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.8534, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8564, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8446, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8445, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8281, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8449, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8405, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8349, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8311, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8383, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8313, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8424, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8323, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8501, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8399, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.8184, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.8418, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.828, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.836, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.825, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8357, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8498, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8361, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8237, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8413, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.823, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8501, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.8372, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8072, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8409, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.856, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8428, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8344, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8317, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.8172, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8305, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8303, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8292, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8162, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8344, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.8545, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8305, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8365, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8375, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8351, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8165, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8194, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8218, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8203, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.832, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8066, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8421, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8217, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8268, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8321, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8266, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.82, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8347, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8472, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8092, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8166, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.817, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8073, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8355, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8232, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8312, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8215, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8263, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8282, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8337, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8291, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8444, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8063, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.825, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8244, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8086, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.823, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8177, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8142, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8236, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8169, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.8143, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8061, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8253, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.812, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.8263, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8144, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8089, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8155, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8142, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8192, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8134, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8175, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8192, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8348, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8147, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8235, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8175, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8197, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.808, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8154, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8104, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8318, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8146, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8097, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8176, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8284, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.8159, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8204, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.8013, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8196, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.802, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8204, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8055, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8171, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8222, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8104, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8147, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.8017, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8059, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.8204, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.812, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8087, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8038, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8094, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8182, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.812, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.809, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8288, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.808, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8127, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8159, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.819, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8108, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8199, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7977, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8171, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8064, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8087, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.8023, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7978, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8268, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8129, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8121, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.8018, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8191, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.813, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8252, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7995, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8162, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8175, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8076, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8063, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8159, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8083, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.807, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.8123, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8107, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8053, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.8068, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.8086, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8042, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.8019, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8117, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8243, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.7953, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8042, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.799, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8093, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8048, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8116, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.8151, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.8017, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8051, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.803, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8094, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8186, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8041, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.8009, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7931, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.8001, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8167, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8114, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.8026, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8063, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8087, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.812, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7899, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.798, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.826, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.8111, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7924, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.8001, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.7906, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.804, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8123, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8164, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8169, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7835, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.8199, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8096, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7792, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7789, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8127, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.816, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8045, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8065, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.8016, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7902, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8044, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8136, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7885, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7734, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8117, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7969, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.7741, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7996, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.806, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7969, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.8017, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8066, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7969, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.8008, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.8111, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7797, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.8016, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7962, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7897, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7951, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.7856, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7823, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8101, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7789, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7993, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8107, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.8005, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8144, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7894, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7763, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.781, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7878, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7956, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.8036, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7945, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7955, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7772, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7805, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.798, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8183, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8106, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7918, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.779, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7881, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7952, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7971, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.8005, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.8014, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7883, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7887, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7719, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8098, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7909, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.7791, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7946, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7973, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7961, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.797, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7961, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7918, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7868, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7843, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7968, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7917, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7872, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.777, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.8049, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7897, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.792, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7866, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8061, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.777, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7883, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7897, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.8014, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7882, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7839, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.794, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7739, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7911, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7907, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.803, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8048, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7816, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.7765, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7916, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.8015, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7826, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7834, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7873, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8033, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7973, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7736, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7968, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7773, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7971, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7808, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7826, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7767, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7962, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7876, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2686615551979702e-05, + "loss": 0.7926, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2589975741014615e-05, + "loss": 0.7939, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.2493581384142767e-05, + "loss": 0.7992, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2397434387918824e-05, + "loss": 0.7766, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.2301536654004948e-05, + "loss": 0.7887, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205890079133252e-05, + "loss": 0.7927, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2110496555068218e-05, + "loss": 0.786, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2015357968569335e-05, + "loss": 0.7821, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1920476201353763e-05, + "loss": 0.7864, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1825853130059098e-05, + "loss": 0.7888, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1731490626206263e-05, + "loss": 0.794, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.16373905561625e-05, + "loss": 0.771, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1543554781104477e-05, + "loss": 0.7984, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1449985156981413e-05, + "loss": 0.7961, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.1356683534478451e-05, + "loss": 0.7824, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1263651758979967e-05, + "loss": 0.7867, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1170891670533162e-05, + "loss": 0.787, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.107840510381158e-05, + "loss": 0.7789, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0986193888078882e-05, + "loss": 0.7951, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.0894259847152636e-05, + "loss": 0.8037, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0802604799368274e-05, + "loss": 0.7901, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0711230557543078e-05, + "loss": 0.7736, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0620138928940394e-05, + "loss": 0.7743, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0529331715233795e-05, + "loss": 0.7971, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0438810712471553e-05, + "loss": 0.7812, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.0348577711041021e-05, + "loss": 0.7788, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0258634495633277e-05, + "loss": 0.7866, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0168982845207797e-05, + "loss": 0.8023, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0079624532957316e-05, + "loss": 0.7766, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99056132627267e-06, + "loss": 0.7831, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.901794986707941e-06, + "loss": 0.7927, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.813327269945547e-06, + "loss": 0.7852, + "step": 5000 + }, + { + "epoch": 1.42, + "learning_rate": 9.725159925761532e-06, + "loss": 0.7649, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 9.637294697990961e-06, + "loss": 0.7818, + "step": 5020 + }, + { + "epoch": 1.42, + "learning_rate": 9.549733324493431e-06, + "loss": 0.7789, + "step": 5030 + }, + { + "epoch": 1.43, + "learning_rate": 9.462477537118717e-06, + "loss": 0.7636, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 9.375529061672467e-06, + "loss": 0.7832, + "step": 5050 + }, + { + "epoch": 1.43, + "learning_rate": 9.288889617882136e-06, + "loss": 0.7959, + "step": 5060 + }, + { + "epoch": 1.44, + "learning_rate": 9.202560919362896e-06, + "loss": 0.7896, + "step": 5070 + }, + { + "epoch": 1.44, + "learning_rate": 9.116544673583824e-06, + "loss": 0.781, + "step": 5080 + }, + { + "epoch": 1.44, + "learning_rate": 9.030842581834062e-06, + "loss": 0.7876, + "step": 5090 + }, + { + "epoch": 1.44, + "learning_rate": 8.945456339189198e-06, + "loss": 0.7818, + "step": 5100 + }, + { + "epoch": 1.45, + "learning_rate": 8.860387634477736e-06, + "loss": 0.7851, + "step": 5110 + }, + { + "epoch": 1.45, + "learning_rate": 8.775638150247714e-06, + "loss": 0.7824, + "step": 5120 + }, + { + "epoch": 1.45, + "learning_rate": 8.691209562733371e-06, + "loss": 0.7988, + "step": 5130 + }, + { + "epoch": 1.46, + "learning_rate": 8.607103541822068e-06, + "loss": 0.7771, + "step": 5140 + }, + { + "epoch": 1.46, + "learning_rate": 8.523321751021176e-06, + "loss": 0.7888, + "step": 5150 + }, + { + "epoch": 1.46, + "learning_rate": 8.43986584742526e-06, + "loss": 0.794, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 8.35673748168323e-06, + "loss": 0.7854, + "step": 5170 + }, + { + "epoch": 1.47, + "learning_rate": 8.273938297965736e-06, + "loss": 0.7927, + "step": 5180 + }, + { + "epoch": 1.47, + "learning_rate": 8.191469933932625e-06, + "loss": 0.801, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 8.109334020700591e-06, + "loss": 0.7816, + "step": 5200 + }, + { + "epoch": 1.48, + "learning_rate": 8.027532182810845e-06, + "loss": 0.7912, + "step": 5210 + }, + { + "epoch": 1.48, + "learning_rate": 7.946066038197065e-06, + "loss": 0.7818, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 7.86493719815333e-06, + "loss": 0.7833, + "step": 5230 + }, + { + "epoch": 1.48, + "learning_rate": 7.784147267302274e-06, + "loss": 0.7919, + "step": 5240 + }, + { + "epoch": 1.49, + "learning_rate": 7.70369784356336e-06, + "loss": 0.771, + "step": 5250 + }, + { + "epoch": 1.49, + "learning_rate": 7.62359051812124e-06, + "loss": 0.7887, + "step": 5260 + }, + { + "epoch": 1.49, + "learning_rate": 7.543826875394347e-06, + "loss": 0.7744, + "step": 5270 + }, + { + "epoch": 1.49, + "learning_rate": 7.464408493003483e-06, + "loss": 0.7887, + "step": 5280 + }, + { + "epoch": 1.5, + "learning_rate": 7.385336941740678e-06, + "loss": 0.7638, + "step": 5290 + }, + { + "epoch": 1.5, + "learning_rate": 7.306613785538066e-06, + "loss": 0.7778, + "step": 5300 + }, + { + "epoch": 1.5, + "learning_rate": 7.2282405814370125e-06, + "loss": 0.7769, + "step": 5310 + }, + { + "epoch": 1.51, + "learning_rate": 7.150218879557263e-06, + "loss": 0.7916, + "step": 5320 + }, + { + "epoch": 1.51, + "learning_rate": 7.072550223066321e-06, + "loss": 0.7798, + "step": 5330 + }, + { + "epoch": 1.51, + "learning_rate": 6.9952361481488896e-06, + "loss": 0.7733, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 6.918278183976554e-06, + "loss": 0.7701, + "step": 5350 + }, + { + "epoch": 1.52, + "learning_rate": 6.841677852677447e-06, + "loss": 0.7792, + "step": 5360 + }, + { + "epoch": 1.52, + "learning_rate": 6.765436669306227e-06, + "loss": 0.7863, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 6.689556141814043e-06, + "loss": 0.7821, + "step": 5380 + }, + { + "epoch": 1.53, + "learning_rate": 6.614037771018775e-06, + "loss": 0.7896, + "step": 5390 + }, + { + "epoch": 1.53, + "learning_rate": 6.538883050575284e-06, + "loss": 0.7943, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 6.464093466945919e-06, + "loss": 0.7933, + "step": 5410 + }, + { + "epoch": 1.53, + "learning_rate": 6.389670499371089e-06, + "loss": 0.7773, + "step": 5420 + }, + { + "epoch": 1.54, + "learning_rate": 6.3156156198400315e-06, + "loss": 0.7828, + "step": 5430 + }, + { + "epoch": 1.54, + "learning_rate": 6.241930293061662e-06, + "loss": 0.7769, + "step": 5440 + }, + { + "epoch": 1.54, + "learning_rate": 6.16861597643564e-06, + "loss": 0.7726, + "step": 5450 + }, + { + "epoch": 1.55, + "learning_rate": 6.0956741200235315e-06, + "loss": 0.7956, + "step": 5460 + }, + { + "epoch": 1.55, + "learning_rate": 6.023106166520104e-06, + "loss": 0.7932, + "step": 5470 + }, + { + "epoch": 1.55, + "learning_rate": 5.950913551224838e-06, + "loss": 0.7849, + "step": 5480 + }, + { + "epoch": 1.55, + "learning_rate": 5.879097702013495e-06, + "loss": 0.7968, + "step": 5490 + }, + { + "epoch": 1.56, + "learning_rate": 5.807660039309904e-06, + "loss": 0.7827, + "step": 5500 + }, + { + "epoch": 1.56, + "learning_rate": 5.736601976057848e-06, + "loss": 0.791, + "step": 5510 + }, + { + "epoch": 1.56, + "learning_rate": 5.66592491769315e-06, + "loss": 0.7792, + "step": 5520 + }, + { + "epoch": 1.57, + "learning_rate": 5.595630262115825e-06, + "loss": 0.7808, + "step": 5530 + }, + { + "epoch": 1.57, + "learning_rate": 5.525719399662488e-06, + "loss": 0.7723, + "step": 5540 + }, + { + "epoch": 1.57, + "learning_rate": 5.456193713078797e-06, + "loss": 0.7789, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 5.387054577492165e-06, + "loss": 0.7903, + "step": 5560 + }, + { + "epoch": 1.58, + "learning_rate": 5.318303360384508e-06, + "loss": 0.7801, + "step": 5570 + }, + { + "epoch": 1.58, + "learning_rate": 5.249941421565227e-06, + "loss": 0.7733, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 5.181970113144296e-06, + "loss": 0.7891, + "step": 5590 + }, + { + "epoch": 1.59, + "learning_rate": 5.114390779505557e-06, + "loss": 0.7912, + "step": 5600 + }, + { + "epoch": 1.59, + "learning_rate": 5.047204757280072e-06, + "loss": 0.7917, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 4.980413375319737e-06, + "loss": 0.7922, + "step": 5620 + }, + { + "epoch": 1.59, + "learning_rate": 4.914017954670961e-06, + "loss": 0.79, + "step": 5630 + }, + { + "epoch": 1.6, + "learning_rate": 4.8480198085485765e-06, + "loss": 0.7844, + "step": 5640 + }, + { + "epoch": 1.6, + "learning_rate": 4.782420242309821e-06, + "loss": 0.7855, + "step": 5650 + }, + { + "epoch": 1.6, + "learning_rate": 4.717220553428559e-06, + "loss": 0.779, + "step": 5660 + }, + { + "epoch": 1.61, + "learning_rate": 4.652422031469583e-06, + "loss": 0.7864, + "step": 5670 + }, + { + "epoch": 1.61, + "learning_rate": 4.58802595806315e-06, + "loss": 0.7802, + "step": 5680 + }, + { + "epoch": 1.61, + "learning_rate": 4.524033606879602e-06, + "loss": 0.7776, + "step": 5690 + }, + { + "epoch": 1.61, + "learning_rate": 4.460446243604169e-06, + "loss": 0.778, + "step": 5700 + }, + { + "epoch": 1.62, + "learning_rate": 4.3972651259119706e-06, + "loss": 0.7834, + "step": 5710 + }, + { + "epoch": 1.62, + "learning_rate": 4.3344915034431e-06, + "loss": 0.7875, + "step": 5720 + }, + { + "epoch": 1.62, + "learning_rate": 4.272126617777933e-06, + "loss": 0.787, + "step": 5730 + }, + { + "epoch": 1.63, + "learning_rate": 4.2101717024125576e-06, + "loss": 0.7773, + "step": 5740 + }, + { + "epoch": 1.63, + "learning_rate": 4.148627982734404e-06, + "loss": 0.7853, + "step": 5750 + }, + { + "epoch": 1.63, + "learning_rate": 4.087496675997965e-06, + "loss": 0.7917, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 4.026778991300762e-06, + "loss": 0.7907, + "step": 5770 + }, + { + "epoch": 1.64, + "learning_rate": 3.966476129559391e-06, + "loss": 0.7764, + "step": 5780 + }, + { + "epoch": 1.64, + "learning_rate": 3.90658928348582e-06, + "loss": 0.7718, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.847119637563739e-06, + "loss": 0.791, + "step": 5800 + }, + { + "epoch": 1.64, + "learning_rate": 3.7880683680251855e-06, + "loss": 0.7732, + "step": 5810 + }, + { + "epoch": 1.65, + "learning_rate": 3.7294366428272386e-06, + "loss": 0.7621, + "step": 5820 + }, + { + "epoch": 1.65, + "learning_rate": 3.6712256216289624e-06, + "loss": 0.7619, + "step": 5830 + }, + { + "epoch": 1.65, + "learning_rate": 3.613436455768418e-06, + "loss": 0.782, + "step": 5840 + }, + { + "epoch": 1.66, + "learning_rate": 3.5560702882399406e-06, + "loss": 0.7853, + "step": 5850 + }, + { + "epoch": 1.66, + "learning_rate": 3.499128253671494e-06, + "loss": 0.7896, + "step": 5860 + }, + { + "epoch": 1.66, + "learning_rate": 3.4426114783022546e-06, + "loss": 0.7939, + "step": 5870 + }, + { + "epoch": 1.66, + "learning_rate": 3.3865210799603253e-06, + "loss": 0.7734, + "step": 5880 + }, + { + "epoch": 1.67, + "learning_rate": 3.3308581680406182e-06, + "loss": 0.7951, + "step": 5890 + }, + { + "epoch": 1.67, + "learning_rate": 3.275623843482939e-06, + "loss": 0.7892, + "step": 5900 + }, + { + "epoch": 1.67, + "learning_rate": 3.220819198750172e-06, + "loss": 0.7788, + "step": 5910 + }, + { + "epoch": 1.68, + "learning_rate": 3.166445317806721e-06, + "loss": 0.8137, + "step": 5920 + }, + { + "epoch": 1.68, + "learning_rate": 3.1125032760970203e-06, + "loss": 0.7665, + "step": 5930 + }, + { + "epoch": 1.68, + "learning_rate": 3.0589941405243043e-06, + "loss": 0.7812, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.0059189694294774e-06, + "loss": 0.7824, + "step": 5950 + }, + { + "epoch": 1.69, + "learning_rate": 2.953278812570201e-06, + "loss": 0.7736, + "step": 5960 + }, + { + "epoch": 1.69, + "learning_rate": 2.9010747111001103e-06, + "loss": 0.7759, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 2.849307697548251e-06, + "loss": 0.7946, + "step": 5980 + }, + { + "epoch": 1.7, + "learning_rate": 2.7979787957986225e-06, + "loss": 0.7938, + "step": 5990 + }, + { + "epoch": 1.7, + "learning_rate": 2.7470890210699596e-06, + "loss": 0.7818, + "step": 6000 + }, + { + "epoch": 1.7, + "learning_rate": 2.6966393798956242e-06, + "loss": 0.7773, + "step": 6010 + }, + { + "epoch": 1.7, + "learning_rate": 2.6466308701037253e-06, + "loss": 0.7779, + "step": 6020 + }, + { + "epoch": 1.71, + "learning_rate": 2.597064480797351e-06, + "loss": 0.7981, + "step": 6030 + }, + { + "epoch": 1.71, + "learning_rate": 2.547941192335035e-06, + "loss": 0.7881, + "step": 6040 + }, + { + "epoch": 1.71, + "learning_rate": 2.4992619763113427e-06, + "loss": 0.7772, + "step": 6050 + }, + { + "epoch": 1.72, + "learning_rate": 2.4510277955376885e-06, + "loss": 0.7812, + "step": 6060 + }, + { + "epoch": 1.72, + "learning_rate": 2.403239604023244e-06, + "loss": 0.7753, + "step": 6070 + }, + { + "epoch": 1.72, + "learning_rate": 2.360612333857401e-06, + "loss": 0.7778, + "step": 6080 + }, + { + "epoch": 1.72, + "learning_rate": 2.31367411862298e-06, + "loss": 0.7883, + "step": 6090 + }, + { + "epoch": 1.73, + "learning_rate": 2.2671846093243493e-06, + "loss": 0.7885, + "step": 6100 + }, + { + "epoch": 1.73, + "learning_rate": 2.221144725463359e-06, + "loss": 0.7876, + "step": 6110 + }, + { + "epoch": 1.73, + "learning_rate": 2.1755553776488745e-06, + "loss": 0.8012, + "step": 6120 + }, + { + "epoch": 1.74, + "learning_rate": 2.130417467578724e-06, + "loss": 0.7967, + "step": 6130 + }, + { + "epoch": 1.74, + "learning_rate": 2.0857318880218995e-06, + "loss": 0.7827, + "step": 6140 + }, + { + "epoch": 1.74, + "learning_rate": 2.0414995228008743e-06, + "loss": 0.7657, + "step": 6150 + }, + { + "epoch": 1.74, + "learning_rate": 1.997721246774145e-06, + "loss": 0.7655, + "step": 6160 + }, + { + "epoch": 1.75, + "learning_rate": 1.9543979258189126e-06, + "loss": 0.7713, + "step": 6170 + }, + { + "epoch": 1.75, + "learning_rate": 1.911530416813953e-06, + "loss": 0.7871, + "step": 6180 + }, + { + "epoch": 1.75, + "learning_rate": 1.869119567622679e-06, + "loss": 0.7983, + "step": 6190 + }, + { + "epoch": 1.76, + "learning_rate": 1.8271662170763787e-06, + "loss": 0.8057, + "step": 6200 + }, + { + "epoch": 1.76, + "learning_rate": 1.7856711949575972e-06, + "loss": 0.7798, + "step": 6210 + }, + { + "epoch": 1.76, + "learning_rate": 1.7446353219837592e-06, + "loss": 0.7845, + "step": 6220 + }, + { + "epoch": 1.76, + "learning_rate": 1.704059409790898e-06, + "loss": 0.7907, + "step": 6230 + }, + { + "epoch": 1.77, + "learning_rate": 1.6639442609176409e-06, + "loss": 0.778, + "step": 6240 + }, + { + "epoch": 1.77, + "learning_rate": 1.6242906687893077e-06, + "loss": 0.7924, + "step": 6250 + }, + { + "epoch": 1.77, + "learning_rate": 1.5850994177022265e-06, + "loss": 0.7988, + "step": 6260 + }, + { + "epoch": 1.78, + "learning_rate": 1.546371282808226e-06, + "loss": 0.7741, + "step": 6270 + }, + { + "epoch": 1.78, + "learning_rate": 1.508107030099304e-06, + "loss": 0.7944, + "step": 6280 + }, + { + "epoch": 1.78, + "learning_rate": 1.4703074163924718e-06, + "loss": 0.7845, + "step": 6290 + }, + { + "epoch": 1.78, + "learning_rate": 1.4329731893147792e-06, + "loss": 0.7832, + "step": 6300 + }, + { + "epoch": 1.79, + "learning_rate": 1.396105087288549e-06, + "loss": 0.7933, + "step": 6310 + }, + { + "epoch": 1.79, + "learning_rate": 1.3597038395167516e-06, + "loss": 0.7803, + "step": 6320 + }, + { + "epoch": 1.79, + "learning_rate": 1.3237701659685854e-06, + "loss": 0.7794, + "step": 6330 + }, + { + "epoch": 1.8, + "learning_rate": 1.28830477736524e-06, + "loss": 0.7715, + "step": 6340 + }, + { + "epoch": 1.8, + "learning_rate": 1.253308375165857e-06, + "loss": 0.7918, + "step": 6350 + }, + { + "epoch": 1.8, + "learning_rate": 1.2187816515536105e-06, + "loss": 0.7829, + "step": 6360 + }, + { + "epoch": 1.8, + "learning_rate": 1.184725289422073e-06, + "loss": 0.7932, + "step": 6370 + }, + { + "epoch": 1.81, + "learning_rate": 1.151139962361658e-06, + "loss": 0.7838, + "step": 6380 + }, + { + "epoch": 1.81, + "learning_rate": 1.1180263346463327e-06, + "loss": 0.7767, + "step": 6390 + }, + { + "epoch": 1.81, + "learning_rate": 1.0853850612204646e-06, + "loss": 0.7757, + "step": 6400 + }, + { + "epoch": 1.81, + "learning_rate": 1.053216787685865e-06, + "loss": 0.779, + "step": 6410 + }, + { + "epoch": 1.82, + "learning_rate": 1.0215221502890254e-06, + "loss": 0.7789, + "step": 6420 + }, + { + "epoch": 1.82, + "learning_rate": 9.903017759085365e-07, + "loss": 0.7738, + "step": 6430 + }, + { + "epoch": 1.82, + "learning_rate": 9.595562820426758e-07, + "loss": 0.7873, + "step": 6440 + }, + { + "epoch": 1.83, + "learning_rate": 9.292862767972199e-07, + "loss": 0.7923, + "step": 6450 + }, + { + "epoch": 1.83, + "learning_rate": 8.994923588733856e-07, + "loss": 0.7888, + "step": 6460 + }, + { + "epoch": 1.83, + "learning_rate": 8.701751175560102e-07, + "loss": 0.7749, + "step": 6470 + }, + { + "epoch": 1.83, + "learning_rate": 8.41335132701887e-07, + "loss": 0.7706, + "step": 6480 + }, + { + "epoch": 1.84, + "learning_rate": 8.129729747283016e-07, + "loss": 0.7896, + "step": 6490 + }, + { + "epoch": 1.84, + "learning_rate": 7.85089204601741e-07, + "loss": 0.7918, + "step": 6500 + }, + { + "epoch": 1.84, + "learning_rate": 7.576843738268113e-07, + "loss": 0.7875, + "step": 6510 + }, + { + "epoch": 1.85, + "learning_rate": 7.307590244353263e-07, + "loss": 0.7871, + "step": 6520 + }, + { + "epoch": 1.85, + "learning_rate": 7.043136889755691e-07, + "loss": 0.7734, + "step": 6530 + }, + { + "epoch": 1.85, + "learning_rate": 6.783488905017871e-07, + "loss": 0.7856, + "step": 6540 + }, + { + "epoch": 1.85, + "learning_rate": 6.528651425638272e-07, + "loss": 0.7964, + "step": 6550 + }, + { + "epoch": 1.86, + "learning_rate": 6.278629491969862e-07, + "loss": 0.778, + "step": 6560 + }, + { + "epoch": 1.86, + "learning_rate": 6.033428049120326e-07, + "loss": 0.7914, + "step": 6570 + }, + { + "epoch": 1.86, + "learning_rate": 5.793051946854422e-07, + "loss": 0.7691, + "step": 6580 + }, + { + "epoch": 1.87, + "learning_rate": 5.557505939497915e-07, + "loss": 0.7893, + "step": 6590 + }, + { + "epoch": 1.87, + "learning_rate": 5.326794685843655e-07, + "loss": 0.7833, + "step": 6600 + }, + { + "epoch": 1.87, + "learning_rate": 5.100922749059239e-07, + "loss": 0.7903, + "step": 6610 + }, + { + "epoch": 1.87, + "learning_rate": 4.879894596597018e-07, + "loss": 0.7683, + "step": 6620 + }, + { + "epoch": 1.88, + "learning_rate": 4.663714600105534e-07, + "loss": 0.7717, + "step": 6630 + }, + { + "epoch": 1.88, + "learning_rate": 4.452387035343203e-07, + "loss": 0.7876, + "step": 6640 + }, + { + "epoch": 1.88, + "learning_rate": 4.2459160820935153e-07, + "loss": 0.7888, + "step": 6650 + }, + { + "epoch": 1.89, + "learning_rate": 4.044305824082717e-07, + "loss": 0.7729, + "step": 6660 + }, + { + "epoch": 1.89, + "learning_rate": 3.84756024889868e-07, + "loss": 0.7824, + "step": 6670 + }, + { + "epoch": 1.89, + "learning_rate": 3.6556832479123504e-07, + "loss": 0.7662, + "step": 6680 + }, + { + "epoch": 1.89, + "learning_rate": 3.468678616200427e-07, + "loss": 0.7981, + "step": 6690 + }, + { + "epoch": 1.9, + "learning_rate": 3.2865500524707217e-07, + "loss": 0.7806, + "step": 6700 + }, + { + "epoch": 1.9, + "learning_rate": 3.109301158988609e-07, + "loss": 0.7858, + "step": 6710 + }, + { + "epoch": 1.9, + "learning_rate": 2.936935441506028e-07, + "loss": 0.7827, + "step": 6720 + }, + { + "epoch": 1.91, + "learning_rate": 2.769456309192037e-07, + "loss": 0.7784, + "step": 6730 + }, + { + "epoch": 1.91, + "learning_rate": 2.6068670745654224e-07, + "loss": 0.7761, + "step": 6740 + }, + { + "epoch": 1.91, + "learning_rate": 2.449170953429225e-07, + "loss": 0.7732, + "step": 6750 + }, + { + "epoch": 1.91, + "learning_rate": 2.296371064806957e-07, + "loss": 0.7899, + "step": 6760 + }, + { + "epoch": 1.92, + "learning_rate": 2.1484704308812053e-07, + "loss": 0.7839, + "step": 6770 + }, + { + "epoch": 1.92, + "learning_rate": 2.0054719769335428e-07, + "loss": 0.7831, + "step": 6780 + }, + { + "epoch": 1.92, + "learning_rate": 1.8673785312869063e-07, + "loss": 0.7817, + "step": 6790 + }, + { + "epoch": 1.93, + "learning_rate": 1.7341928252495033e-07, + "loss": 0.792, + "step": 6800 + }, + { + "epoch": 1.93, + "learning_rate": 1.60591749306091e-07, + "loss": 0.7942, + "step": 6810 + }, + { + "epoch": 1.93, + "learning_rate": 1.4825550718398362e-07, + "loss": 0.7607, + "step": 6820 + }, + { + "epoch": 1.93, + "learning_rate": 1.3641080015341369e-07, + "loss": 0.7743, + "step": 6830 + }, + { + "epoch": 1.94, + "learning_rate": 1.2505786248723229e-07, + "loss": 0.763, + "step": 6840 + }, + { + "epoch": 1.94, + "learning_rate": 1.1419691873174043e-07, + "loss": 0.7685, + "step": 6850 + }, + { + "epoch": 1.94, + "learning_rate": 1.038281837022398e-07, + "loss": 0.7773, + "step": 6860 + }, + { + "epoch": 1.95, + "learning_rate": 9.395186247878329e-08, + "loss": 0.7663, + "step": 6870 + }, + { + "epoch": 1.95, + "learning_rate": 8.456815040212562e-08, + "loss": 0.7769, + "step": 6880 + }, + { + "epoch": 1.95, + "learning_rate": 7.567723306984853e-08, + "loss": 0.7921, + "step": 6890 + }, + { + "epoch": 1.95, + "learning_rate": 6.727928633270264e-08, + "loss": 0.7877, + "step": 6900 + }, + { + "epoch": 1.96, + "learning_rate": 5.937447629112414e-08, + "loss": 0.7709, + "step": 6910 + }, + { + "epoch": 1.96, + "learning_rate": 5.196295929193739e-08, + "loss": 0.7921, + "step": 6920 + }, + { + "epoch": 1.96, + "learning_rate": 4.5044881925287994e-08, + "loss": 0.7707, + "step": 6930 + }, + { + "epoch": 1.96, + "learning_rate": 3.862038102172283e-08, + "loss": 0.7752, + "step": 6940 + }, + { + "epoch": 1.97, + "learning_rate": 3.268958364948671e-08, + "loss": 0.7728, + "step": 6950 + }, + { + "epoch": 1.97, + "learning_rate": 2.7252607112018823e-08, + "loss": 0.7651, + "step": 6960 + }, + { + "epoch": 1.97, + "learning_rate": 2.2309558945621257e-08, + "loss": 0.7892, + "step": 6970 + }, + { + "epoch": 1.98, + "learning_rate": 1.7860536917341243e-08, + "loss": 0.7671, + "step": 6980 + }, + { + "epoch": 1.98, + "learning_rate": 1.3905629023031052e-08, + "loss": 0.7767, + "step": 6990 + }, + { + "epoch": 1.98, + "learning_rate": 1.0444913485610498e-08, + "loss": 0.7847, + "step": 7000 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 1.2562705410454192e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/checkpoint-7000/training_args.bin b/sft-qlora/checkpoint-7000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/checkpoint-7000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/finetuning_args.json b/sft-qlora/finetuning_args.json new file mode 100644 index 0000000000000000000000000000000000000000..36a921b3eb84159ad54e7697e9d7d3e2fde38fec --- /dev/null +++ b/sft-qlora/finetuning_args.json @@ -0,0 +1,13 @@ +{ + "finetuning_type": "lora", + "lora_alpha": 32.0, + "lora_dropout": 0.1, + "lora_rank": 8, + "lora_target": [ + "q_proj", + "v_proj" + ], + "name_module_trainable": "mlp", + "num_hidden_layers": 32, + "num_layer_trainable": 3 +} diff --git a/sft-qlora/train_results.json b/sft-qlora/train_results.json new file mode 100644 index 0000000000000000000000000000000000000000..fbc8abca687789f58146a86e9665e52ea5ca99cc --- /dev/null +++ b/sft-qlora/train_results.json @@ -0,0 +1,7 @@ +{ + "epoch": 2.0, + "train_loss": 0.8239178928553991, + "train_runtime": 71865.5404, + "train_samples_per_second": 6.291, + "train_steps_per_second": 0.098 +} \ No newline at end of file diff --git a/sft-qlora/trainer_log.jsonl b/sft-qlora/trainer_log.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f0282ac9f74a37ce4e7b0e8bd75d587c09719f1a --- /dev/null +++ b/sft-qlora/trainer_log.jsonl @@ -0,0 +1,2824 @@ +{"current_steps": 10, "total_steps": 7064, "loss": 1.3185, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:01:34", "remaining_time": "18:35:59"} +{"current_steps": 10, "total_steps": 7064, "loss": 1.3185, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:01:32", "remaining_time": "18:12:17"} +{"current_steps": 10, "total_steps": 7064, "loss": 1.3185, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:01:33", "remaining_time": "18:23:15"} +{"current_steps": 10, "total_steps": 7064, "loss": 1.3185, "reward": null, "learning_rate": 4.9999752766303955e-05, "epoch": 0.0, "percentage": 0.14, "elapsed_time": "0:05:26", "remaining_time": "2 days, 15:55:14"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2795, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:07:00", "remaining_time": "1 day, 17:09:04"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2795, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:03:09", "remaining_time": "18:31:22"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2795, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:03:08", "remaining_time": "18:25:01"} +{"current_steps": 20, "total_steps": 7064, "loss": 1.2795, "reward": null, "learning_rate": 4.999901107010577e-05, "epoch": 0.01, "percentage": 0.28, "elapsed_time": "0:03:07", "remaining_time": "18:19:32"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2266, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:04:44", "remaining_time": "18:32:14"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2266, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:08:37", "remaining_time": "1 day, 9:40:19"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2266, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:04:43", "remaining_time": "18:28:35"} +{"current_steps": 30, "total_steps": 7064, "loss": 1.2266, "reward": null, "learning_rate": 4.999777492607524e-05, "epoch": 0.01, "percentage": 0.42, "elapsed_time": "0:04:45", "remaining_time": "18:36:28"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.19, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:06:23", "remaining_time": "18:42:37"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.19, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:10:14", "remaining_time": "1 day, 5:59:32"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.19, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:06:21", "remaining_time": "18:36:43"} +{"current_steps": 40, "total_steps": 7064, "loss": 1.19, "reward": null, "learning_rate": 4.9996044358661676e-05, "epoch": 0.01, "percentage": 0.57, "elapsed_time": "0:06:22", "remaining_time": "18:39:27"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1643, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:08:02", "remaining_time": "18:47:26"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1643, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:08:00", "remaining_time": "18:42:44"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1643, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:08:01", "remaining_time": "18:44:55"} +{"current_steps": 50, "total_steps": 7064, "loss": 1.1643, "reward": null, "learning_rate": 4.9993819402093446e-05, "epoch": 0.01, "percentage": 0.71, "elapsed_time": "0:11:53", "remaining_time": "1 day, 3:48:12"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.1381, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:13:33", "remaining_time": "1 day, 2:21:56"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.1381, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:09:40", "remaining_time": "18:49:50"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.1381, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:09:39", "remaining_time": "18:48:01"} +{"current_steps": 60, "total_steps": 7064, "loss": 1.1381, "reward": null, "learning_rate": 4.999110010037728e-05, "epoch": 0.02, "percentage": 0.85, "elapsed_time": "0:09:41", "remaining_time": "18:51:56"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.1113, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:15:13", "remaining_time": "1 day, 1:20:23"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.1113, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:11:21", "remaining_time": "18:55:14"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.1113, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:11:19", "remaining_time": "18:51:52"} +{"current_steps": 70, "total_steps": 7064, "loss": 1.1113, "reward": null, "learning_rate": 4.998788650729743e-05, "epoch": 0.02, "percentage": 0.99, "elapsed_time": "0:11:20", "remaining_time": "18:53:25"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0892, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:13:00", "remaining_time": "18:55:19"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0892, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:12:59", "remaining_time": "18:53:57"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0892, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:13:01", "remaining_time": "18:56:53"} +{"current_steps": 80, "total_steps": 7064, "loss": 1.0892, "reward": null, "learning_rate": 4.998417868641457e-05, "epoch": 0.02, "percentage": 1.13, "elapsed_time": "0:16:52", "remaining_time": "1 day, 0:33:25"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0801, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:18:31", "remaining_time": "23:55:24"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0801, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:14:40", "remaining_time": "18:56:42"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0801, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:14:39", "remaining_time": "18:55:18"} +{"current_steps": 90, "total_steps": 7064, "loss": 1.0801, "reward": null, "learning_rate": 4.9979976711064556e-05, "epoch": 0.03, "percentage": 1.27, "elapsed_time": "0:14:38", "remaining_time": "18:54:05"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0822, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:20:13", "remaining_time": "23:28:03"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0822, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:16:21", "remaining_time": "18:59:35"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0822, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:16:20", "remaining_time": "18:58:20"} +{"current_steps": 100, "total_steps": 7064, "loss": 1.0822, "reward": null, "learning_rate": 4.9975280664357e-05, "epoch": 0.03, "percentage": 1.42, "elapsed_time": "0:16:19", "remaining_time": "18:57:15"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0794, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:18:00", "remaining_time": "18:58:00"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0794, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:21:52", "remaining_time": "23:02:51"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0794, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:17:59", "remaining_time": "18:57:01"} +{"current_steps": 110, "total_steps": 7064, "loss": 1.0794, "reward": null, "learning_rate": 4.997009063917356e-05, "epoch": 0.03, "percentage": 1.56, "elapsed_time": "0:18:01", "remaining_time": "18:59:09"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.0419, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:23:33", "remaining_time": "22:43:01"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.0419, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:19:41", "remaining_time": "18:59:57"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.0419, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:19:39", "remaining_time": "18:58:00"} +{"current_steps": 120, "total_steps": 7064, "loss": 1.0419, "reward": null, "learning_rate": 4.996440673816617e-05, "epoch": 0.03, "percentage": 1.7, "elapsed_time": "0:19:40", "remaining_time": "18:58:54"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.049, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:21:23", "remaining_time": "19:00:52"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.049, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:21:21", "remaining_time": "18:59:04"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.049, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:21:22", "remaining_time": "18:59:54"} +{"current_steps": 130, "total_steps": 7064, "loss": 1.049, "reward": null, "learning_rate": 4.995822907375498e-05, "epoch": 0.04, "percentage": 1.84, "elapsed_time": "0:25:14", "remaining_time": "22:26:29"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0202, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:26:54", "remaining_time": "22:10:29"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0202, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:23:01", "remaining_time": "18:58:56"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0202, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:23:02", "remaining_time": "18:59:50"} +{"current_steps": 140, "total_steps": 7064, "loss": 1.0202, "reward": null, "learning_rate": 4.9951557768126136e-05, "epoch": 0.04, "percentage": 1.98, "elapsed_time": "0:23:00", "remaining_time": "18:58:10"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.0226, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:28:35", "remaining_time": "21:58:10"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.0226, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:24:44", "remaining_time": "19:00:29"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.0226, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:24:42", "remaining_time": "18:58:56"} +{"current_steps": 150, "total_steps": 7064, "loss": 1.0226, "reward": null, "learning_rate": 4.9944392953229365e-05, "epoch": 0.04, "percentage": 2.12, "elapsed_time": "0:24:43", "remaining_time": "18:59:39"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9927, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:30:21", "remaining_time": "21:49:37"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9927, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:26:29", "remaining_time": "19:03:16"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9927, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:26:27", "remaining_time": "19:01:49"} +{"current_steps": 160, "total_steps": 7064, "loss": 0.9927, "reward": null, "learning_rate": 4.993673477077535e-05, "epoch": 0.05, "percentage": 2.27, "elapsed_time": "0:26:28", "remaining_time": "19:02:30"} +{"current_steps": 170, "total_steps": 7064, "loss": 1.0006, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:32:02", "remaining_time": "21:39:35"} +{"current_steps": 170, "total_steps": 7064, "loss": 1.0006, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:28:11", "remaining_time": "19:03:15"} +{"current_steps": 170, "total_steps": 7064, "loss": 1.0006, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:28:10", "remaining_time": "19:02:31"} +{"current_steps": 170, "total_steps": 7064, "loss": 1.0006, "reward": null, "learning_rate": 4.9928583372232954e-05, "epoch": 0.05, "percentage": 2.41, "elapsed_time": "0:28:09", "remaining_time": "19:01:53"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9999, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:33:44", "remaining_time": "21:30:09"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9999, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:29:52", "remaining_time": "19:02:43"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9999, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:29:50", "remaining_time": "19:01:26"} +{"current_steps": 180, "total_steps": 7064, "loss": 0.9999, "reward": null, "learning_rate": 4.991993891882622e-05, "epoch": 0.05, "percentage": 2.55, "elapsed_time": "0:29:51", "remaining_time": "19:02:02"} +{"current_steps": 190, "total_steps": 7064, "loss": 1.0003, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:31:32", "remaining_time": "19:00:59"} +{"current_steps": 190, "total_steps": 7064, "loss": 1.0003, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:31:31", "remaining_time": "19:00:25"} +{"current_steps": 190, "total_steps": 7064, "loss": 1.0003, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:31:33", "remaining_time": "19:01:38"} +{"current_steps": 190, "total_steps": 7064, "loss": 1.0003, "reward": null, "learning_rate": 4.991080158153115e-05, "epoch": 0.05, "percentage": 2.69, "elapsed_time": "0:35:24", "remaining_time": "21:21:06"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9875, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:37:06", "remaining_time": "21:13:43"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9875, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:33:15", "remaining_time": "19:01:25"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9875, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:33:13", "remaining_time": "19:00:16"} +{"current_steps": 200, "total_steps": 7064, "loss": 0.9875, "reward": null, "learning_rate": 4.990117154107236e-05, "epoch": 0.06, "percentage": 2.83, "elapsed_time": "0:33:14", "remaining_time": "19:00:48"} +{"current_steps": 210, "total_steps": 7064, "loss": 1.004, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:38:47", "remaining_time": "21:06:01"} +{"current_steps": 210, "total_steps": 7064, "loss": 1.004, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:34:56", "remaining_time": "19:00:12"} +{"current_steps": 210, "total_steps": 7064, "loss": 1.004, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:34:55", "remaining_time": "18:59:36"} +{"current_steps": 210, "total_steps": 7064, "loss": 1.004, "reward": null, "learning_rate": 4.989104898791949e-05, "epoch": 0.06, "percentage": 2.97, "elapsed_time": "0:34:54", "remaining_time": "18:59:06"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.9835, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:40:25", "remaining_time": "20:57:48"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.9835, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:36:32", "remaining_time": "18:56:50"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.9835, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:36:34", "remaining_time": "18:57:53"} +{"current_steps": 220, "total_steps": 7064, "loss": 0.9835, "reward": null, "learning_rate": 4.988043412228343e-05, "epoch": 0.06, "percentage": 3.11, "elapsed_time": "0:36:33", "remaining_time": "18:57:19"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9765, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:42:05", "remaining_time": "20:50:39"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9765, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:38:13", "remaining_time": "18:55:34"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9765, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:38:12", "remaining_time": "18:55:06"} +{"current_steps": 230, "total_steps": 7064, "loss": 0.9765, "reward": null, "learning_rate": 4.986932715411239e-05, "epoch": 0.07, "percentage": 3.26, "elapsed_time": "0:38:14", "remaining_time": "18:56:06"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9755, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:43:47", "remaining_time": "20:45:09"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9755, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:39:55", "remaining_time": "18:55:02"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9755, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:39:56", "remaining_time": "18:55:32"} +{"current_steps": 240, "total_steps": 7064, "loss": 0.9755, "reward": null, "learning_rate": 4.985772830308771e-05, "epoch": 0.07, "percentage": 3.4, "elapsed_time": "0:39:54", "remaining_time": "18:54:35"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9798, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:45:29", "remaining_time": "20:39:46"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9798, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:41:36", "remaining_time": "18:54:12"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9798, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:41:37", "remaining_time": "18:54:41"} +{"current_steps": 250, "total_steps": 7064, "loss": 0.9798, "reward": null, "learning_rate": 4.9845637798619536e-05, "epoch": 0.07, "percentage": 3.54, "elapsed_time": "0:41:35", "remaining_time": "18:53:47"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9779, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:47:08", "remaining_time": "20:33:48"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9779, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:43:17", "remaining_time": "18:52:55"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9779, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:43:16", "remaining_time": "18:52:27"} +{"current_steps": 260, "total_steps": 7064, "loss": 0.9779, "reward": null, "learning_rate": 4.983305587984227e-05, "epoch": 0.07, "percentage": 3.68, "elapsed_time": "0:43:15", "remaining_time": "18:52:03"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9707, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:44:54", "remaining_time": "18:49:55"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9707, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:44:56", "remaining_time": "18:50:46"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9707, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:44:55", "remaining_time": "18:50:19"} +{"current_steps": 270, "total_steps": 7064, "loss": 0.9707, "reward": null, "learning_rate": 4.981998279560986e-05, "epoch": 0.08, "percentage": 3.82, "elapsed_time": "0:48:47", "remaining_time": "20:27:46"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.987, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:50:27", "remaining_time": "20:22:27"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.987, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:46:34", "remaining_time": "18:48:37"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.987, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:46:33", "remaining_time": "18:48:14"} +{"current_steps": 280, "total_steps": 7064, "loss": 0.987, "reward": null, "learning_rate": 4.980641880449086e-05, "epoch": 0.08, "percentage": 3.96, "elapsed_time": "0:46:36", "remaining_time": "18:49:03"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.9493, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:52:07", "remaining_time": "20:17:37"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.9493, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:48:15", "remaining_time": "18:47:09"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.9493, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:48:16", "remaining_time": "18:47:35"} +{"current_steps": 290, "total_steps": 7064, "loss": 0.9493, "reward": null, "learning_rate": 4.9792364174763323e-05, "epoch": 0.08, "percentage": 4.11, "elapsed_time": "0:48:14", "remaining_time": "18:46:48"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9701, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:53:50", "remaining_time": "20:13:48"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9701, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:49:57", "remaining_time": "18:46:29"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9701, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:49:56", "remaining_time": "18:46:08"} +{"current_steps": 300, "total_steps": 7064, "loss": 0.9701, "reward": null, "learning_rate": 4.977781918440949e-05, "epoch": 0.08, "percentage": 4.25, "elapsed_time": "0:49:58", "remaining_time": "18:46:54"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9476, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:51:40", "remaining_time": "18:45:57"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9476, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:51:38", "remaining_time": "18:45:13"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9476, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:51:39", "remaining_time": "18:45:34"} +{"current_steps": 310, "total_steps": 7064, "loss": 0.9476, "reward": null, "learning_rate": 4.97627841211103e-05, "epoch": 0.09, "percentage": 4.39, "elapsed_time": "0:55:32", "remaining_time": "20:09:56"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9218, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:57:13", "remaining_time": "20:06:02"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9218, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:53:21", "remaining_time": "18:44:25"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9218, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:53:20", "remaining_time": "18:44:05"} +{"current_steps": 320, "total_steps": 7064, "loss": 0.9218, "reward": null, "learning_rate": 4.97472592822397e-05, "epoch": 0.09, "percentage": 4.53, "elapsed_time": "0:53:22", "remaining_time": "18:44:48"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9481, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:58:53", "remaining_time": "20:01:38"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9481, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:55:01", "remaining_time": "18:42:58"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9481, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:55:00", "remaining_time": "18:42:36"} +{"current_steps": 330, "total_steps": 7064, "loss": 0.9481, "reward": null, "learning_rate": 4.9731244974858746e-05, "epoch": 0.09, "percentage": 4.67, "elapsed_time": "0:54:59", "remaining_time": "18:42:17"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9508, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "1:00:34", "remaining_time": "19:58:04"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9508, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "0:56:42", "remaining_time": "18:41:28"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9508, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "0:56:43", "remaining_time": "18:41:50"} +{"current_steps": 340, "total_steps": 7064, "loss": 0.9508, "reward": null, "learning_rate": 4.971474151570955e-05, "epoch": 0.1, "percentage": 4.81, "elapsed_time": "0:56:41", "remaining_time": "18:41:10"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9587, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "1:02:16", "remaining_time": "19:54:37"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9587, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "0:58:25", "remaining_time": "18:40:40"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9587, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "0:58:24", "remaining_time": "18:40:20"} +{"current_steps": 350, "total_steps": 7064, "loss": 0.9587, "reward": null, "learning_rate": 4.9697749231209025e-05, "epoch": 0.1, "percentage": 4.95, "elapsed_time": "0:58:23", "remaining_time": "18:40:02"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9371, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "1:00:04", "remaining_time": "18:38:41"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9371, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "1:03:56", "remaining_time": "19:50:49"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9371, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "1:00:05", "remaining_time": "18:39:01"} +{"current_steps": 360, "total_steps": 7064, "loss": 0.9371, "reward": null, "learning_rate": 4.968026845744237e-05, "epoch": 0.1, "percentage": 5.1, "elapsed_time": "1:00:03", "remaining_time": "18:38:24"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.9242, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "1:01:45", "remaining_time": "18:37:21"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.9242, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "1:01:46", "remaining_time": "18:37:38"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.9242, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "1:01:47", "remaining_time": "18:37:57"} +{"current_steps": 370, "total_steps": 7064, "loss": 0.9242, "reward": null, "learning_rate": 4.96622995401565e-05, "epoch": 0.1, "percentage": 5.24, "elapsed_time": "1:05:38", "remaining_time": "19:47:42"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9229, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "1:03:25", "remaining_time": "18:35:41"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9229, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "1:03:26", "remaining_time": "18:36:00"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9229, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "1:03:24", "remaining_time": "18:35:25"} +{"current_steps": 380, "total_steps": 7064, "loss": 0.9229, "reward": null, "learning_rate": 4.9643842834753174e-05, "epoch": 0.11, "percentage": 5.38, "elapsed_time": "1:07:18", "remaining_time": "19:43:48"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9271, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:05:08", "remaining_time": "18:34:53"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9271, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:05:08", "remaining_time": "18:34:37"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9271, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:05:10", "remaining_time": "18:35:12"} +{"current_steps": 390, "total_steps": 7064, "loss": 0.9271, "reward": null, "learning_rate": 4.962489870628193e-05, "epoch": 0.11, "percentage": 5.52, "elapsed_time": "1:09:01", "remaining_time": "19:41:10"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.9309, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:06:46", "remaining_time": "18:32:36"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.9309, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:06:46", "remaining_time": "18:32:20"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.9309, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:06:48", "remaining_time": "18:32:54"} +{"current_steps": 400, "total_steps": 7064, "loss": 0.9309, "reward": null, "learning_rate": 4.960546752943294e-05, "epoch": 0.11, "percentage": 5.66, "elapsed_time": "1:10:39", "remaining_time": "19:37:07"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9102, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:12:21", "remaining_time": "19:34:15"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9102, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:08:29", "remaining_time": "18:31:41"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9102, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:08:27", "remaining_time": "18:31:08"} +{"current_steps": 410, "total_steps": 7064, "loss": 0.9102, "reward": null, "learning_rate": 4.958554968852952e-05, "epoch": 0.12, "percentage": 5.8, "elapsed_time": "1:08:28", "remaining_time": "18:31:23"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9089, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:14:02", "remaining_time": "19:31:10"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9089, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:10:10", "remaining_time": "18:30:11"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9089, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:10:09", "remaining_time": "18:29:54"} +{"current_steps": 420, "total_steps": 7064, "loss": 0.9089, "reward": null, "learning_rate": 4.95651455775206e-05, "epoch": 0.12, "percentage": 5.95, "elapsed_time": "1:10:08", "remaining_time": "18:29:39"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9236, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:15:44", "remaining_time": "19:28:33"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9236, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:11:51", "remaining_time": "18:28:33"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9236, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:11:53", "remaining_time": "18:29:04"} +{"current_steps": 430, "total_steps": 7064, "loss": 0.9236, "reward": null, "learning_rate": 4.954425559997287e-05, "epoch": 0.12, "percentage": 6.09, "elapsed_time": "1:11:52", "remaining_time": "18:28:47"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9184, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:13:30", "remaining_time": "18:26:32"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9184, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:13:32", "remaining_time": "18:27:03"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9184, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:13:31", "remaining_time": "18:26:46"} +{"current_steps": 440, "total_steps": 7064, "loss": 0.9184, "reward": null, "learning_rate": 4.952288016906284e-05, "epoch": 0.12, "percentage": 6.23, "elapsed_time": "1:17:23", "remaining_time": "19:25:05"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9112, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:15:13", "remaining_time": "18:25:40"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9112, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:15:12", "remaining_time": "18:25:24"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9112, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:15:11", "remaining_time": "18:25:10"} +{"current_steps": 450, "total_steps": 7064, "loss": 0.9112, "reward": null, "learning_rate": 4.9501019707568665e-05, "epoch": 0.13, "percentage": 6.37, "elapsed_time": "1:19:04", "remaining_time": "19:22:19"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9178, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:16:53", "remaining_time": "18:23:46"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9178, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:16:54", "remaining_time": "18:24:02"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9178, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:16:52", "remaining_time": "18:23:33"} +{"current_steps": 460, "total_steps": 7064, "loss": 0.9178, "reward": null, "learning_rate": 4.947867464786174e-05, "epoch": 0.13, "percentage": 6.51, "elapsed_time": "1:20:45", "remaining_time": "19:19:23"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9364, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:22:25", "remaining_time": "19:16:20"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9364, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:18:31", "remaining_time": "18:21:47"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9364, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:18:32", "remaining_time": "18:22:00"} +{"current_steps": 470, "total_steps": 7064, "loss": 0.9364, "reward": null, "learning_rate": 4.945584543189823e-05, "epoch": 0.13, "percentage": 6.65, "elapsed_time": "1:18:33", "remaining_time": "18:22:15"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9262, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:24:05", "remaining_time": "19:13:29"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9262, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:20:14", "remaining_time": "18:20:37"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9262, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:20:13", "remaining_time": "18:20:22"} +{"current_steps": 480, "total_steps": 7064, "loss": 0.9262, "reward": null, "learning_rate": 4.943253251121022e-05, "epoch": 0.14, "percentage": 6.8, "elapsed_time": "1:20:12", "remaining_time": "18:20:09"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.9037, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:25:48", "remaining_time": "19:11:20"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.9037, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:21:56", "remaining_time": "18:19:22"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.9037, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:21:55", "remaining_time": "18:19:10"} +{"current_steps": 490, "total_steps": 7064, "loss": 0.9037, "reward": null, "learning_rate": 4.9408736346896894e-05, "epoch": 0.14, "percentage": 6.94, "elapsed_time": "1:21:57", "remaining_time": "18:19:37"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.928, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:27:34", "remaining_time": "19:09:40"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.928, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:23:43", "remaining_time": "18:19:04"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.928, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:23:42", "remaining_time": "18:18:49"} +{"current_steps": 500, "total_steps": 7064, "loss": 0.928, "reward": null, "learning_rate": 4.938445740961534e-05, "epoch": 0.14, "percentage": 7.08, "elapsed_time": "1:23:41", "remaining_time": "18:18:37"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.9064, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:25:28", "remaining_time": "18:18:25"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.9064, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:25:29", "remaining_time": "18:18:39"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.9064, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:25:27", "remaining_time": "18:18:13"} +{"current_steps": 510, "total_steps": 7064, "loss": 0.9064, "reward": null, "learning_rate": 4.935969617957126e-05, "epoch": 0.14, "percentage": 7.22, "elapsed_time": "1:29:20", "remaining_time": "19:08:11"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9107, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:31:01", "remaining_time": "19:05:26"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9107, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:27:09", "remaining_time": "18:16:55"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9107, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:27:08", "remaining_time": "18:16:41"} +{"current_steps": 520, "total_steps": 7064, "loss": 0.9107, "reward": null, "learning_rate": 4.93344531465095e-05, "epoch": 0.15, "percentage": 7.36, "elapsed_time": "1:27:07", "remaining_time": "18:16:29"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.905, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:32:39", "remaining_time": "19:02:20"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.905, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:28:48", "remaining_time": "18:14:49"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.905, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:28:47", "remaining_time": "18:14:36"} +{"current_steps": 530, "total_steps": 7064, "loss": 0.905, "reward": null, "learning_rate": 4.930872880970432e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "1:28:46", "remaining_time": "18:14:24"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9234, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:34:17", "remaining_time": "18:59:16"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9234, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:30:25", "remaining_time": "18:12:28"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9234, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:30:26", "remaining_time": "18:12:41"} +{"current_steps": 540, "total_steps": 7064, "loss": 0.9234, "reward": null, "learning_rate": 4.9282523677949556e-05, "epoch": 0.15, "percentage": 7.64, "elapsed_time": "1:30:24", "remaining_time": "18:12:17"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:36:00", "remaining_time": "18:57:04"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:32:09", "remaining_time": "18:11:25"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:32:08", "remaining_time": "18:11:12"} +{"current_steps": 550, "total_steps": 7064, "loss": 0.906, "reward": null, "learning_rate": 4.9255838269548524e-05, "epoch": 0.16, "percentage": 7.79, "elapsed_time": "1:32:07", "remaining_time": "18:11:01"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8885, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:37:42", "remaining_time": "18:54:51"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8885, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:33:50", "remaining_time": "18:09:52"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8885, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:33:49", "remaining_time": "18:09:42"} +{"current_steps": 560, "total_steps": 7064, "loss": 0.8885, "reward": null, "learning_rate": 4.9228673112303814e-05, "epoch": 0.16, "percentage": 7.93, "elapsed_time": "1:33:51", "remaining_time": "18:10:05"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9103, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:39:21", "remaining_time": "18:51:54"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9103, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:35:28", "remaining_time": "18:07:47"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9103, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:35:27", "remaining_time": "18:07:36"} +{"current_steps": 570, "total_steps": 7064, "loss": 0.9103, "reward": null, "learning_rate": 4.9201028743506794e-05, "epoch": 0.16, "percentage": 8.07, "elapsed_time": "1:35:29", "remaining_time": "18:07:59"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.895, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:41:01", "remaining_time": "18:49:22"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.895, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:37:09", "remaining_time": "18:06:04"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.895, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:37:08", "remaining_time": "18:05:53"} +{"current_steps": 580, "total_steps": 7064, "loss": 0.895, "reward": null, "learning_rate": 4.917290570992702e-05, "epoch": 0.16, "percentage": 8.21, "elapsed_time": "1:37:10", "remaining_time": "18:06:16"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.8948, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:38:45", "remaining_time": "18:03:36"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.8948, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:42:37", "remaining_time": "18:46:06"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.8948, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:38:46", "remaining_time": "18:03:48"} +{"current_steps": 590, "total_steps": 7064, "loss": 0.8948, "reward": null, "learning_rate": 4.9144304567801415e-05, "epoch": 0.17, "percentage": 8.35, "elapsed_time": "1:38:44", "remaining_time": "18:03:25"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.9109, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:44:19", "remaining_time": "18:43:59"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.9109, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:40:28", "remaining_time": "18:02:28"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.9109, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:40:27", "remaining_time": "18:02:16"} +{"current_steps": 600, "total_steps": 7064, "loss": 0.9109, "reward": null, "learning_rate": 4.911522588282327e-05, "epoch": 0.17, "percentage": 8.49, "elapsed_time": "1:40:26", "remaining_time": "18:02:06"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8914, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:42:08", "remaining_time": "18:00:45"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8914, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:42:06", "remaining_time": "18:00:23"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8914, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:42:07", "remaining_time": "18:00:33"} +{"current_steps": 610, "total_steps": 7064, "loss": 0.8914, "reward": null, "learning_rate": 4.908567023013104e-05, "epoch": 0.17, "percentage": 8.64, "elapsed_time": "1:46:00", "remaining_time": "18:41:32"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.892, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:43:48", "remaining_time": "17:58:56"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.892, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:43:49", "remaining_time": "17:59:07"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.892, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:43:47", "remaining_time": "17:58:46"} +{"current_steps": 620, "total_steps": 7064, "loss": 0.892, "reward": null, "learning_rate": 4.9055638194296994e-05, "epoch": 0.18, "percentage": 8.78, "elapsed_time": "1:47:40", "remaining_time": "18:39:11"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.9049, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:49:21", "remaining_time": "18:36:48"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.9049, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:45:27", "remaining_time": "17:57:05"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.9049, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:45:28", "remaining_time": "17:57:15"} +{"current_steps": 630, "total_steps": 7064, "loss": 0.9049, "reward": null, "learning_rate": 4.902513036931562e-05, "epoch": 0.18, "percentage": 8.92, "elapsed_time": "1:45:30", "remaining_time": "17:57:26"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.904, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:47:08", "remaining_time": "17:55:23"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.904, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:47:06", "remaining_time": "17:55:03"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.904, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:47:07", "remaining_time": "17:55:12"} +{"current_steps": 640, "total_steps": 7064, "loss": 0.904, "reward": null, "learning_rate": 4.89941473585919e-05, "epoch": 0.18, "percentage": 9.06, "elapsed_time": "1:50:59", "remaining_time": "18:34:05"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:52:41", "remaining_time": "18:32:03"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:48:49", "remaining_time": "17:53:50"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:48:50", "remaining_time": "17:54:01"} +{"current_steps": 650, "total_steps": 7064, "loss": 0.8983, "reward": null, "learning_rate": 4.89626897749294e-05, "epoch": 0.18, "percentage": 9.2, "elapsed_time": "1:48:48", "remaining_time": "17:53:41"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.8884, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:54:22", "remaining_time": "18:29:45"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.8884, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:50:29", "remaining_time": "17:52:10"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.8884, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:50:28", "remaining_time": "17:52:01"} +{"current_steps": 660, "total_steps": 7064, "loss": 0.8884, "reward": null, "learning_rate": 4.893075824051807e-05, "epoch": 0.19, "percentage": 9.34, "elapsed_time": "1:50:31", "remaining_time": "17:52:20"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8886, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:56:01", "remaining_time": "18:27:16"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8886, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:52:10", "remaining_time": "17:50:29"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8886, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:52:09", "remaining_time": "17:50:18"} +{"current_steps": 670, "total_steps": 7064, "loss": 0.8886, "reward": null, "learning_rate": 4.889835338692201e-05, "epoch": 0.19, "percentage": 9.48, "elapsed_time": "1:52:08", "remaining_time": "17:50:10"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8998, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:57:45", "remaining_time": "18:25:31"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8998, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:53:52", "remaining_time": "17:49:01"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8998, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:53:53", "remaining_time": "17:49:10"} +{"current_steps": 680, "total_steps": 7064, "loss": 0.8998, "reward": null, "learning_rate": 4.886547585506698e-05, "epoch": 0.19, "percentage": 9.63, "elapsed_time": "1:53:54", "remaining_time": "17:49:20"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8753, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:59:26", "remaining_time": "18:23:24"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8753, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:55:35", "remaining_time": "17:47:47"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8753, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:55:34", "remaining_time": "17:47:37"} +{"current_steps": 690, "total_steps": 7064, "loss": 0.8753, "reward": null, "learning_rate": 4.8832126295227656e-05, "epoch": 0.2, "percentage": 9.77, "elapsed_time": "1:55:33", "remaining_time": "17:47:29"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "2:01:09", "remaining_time": "18:21:28"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "1:57:16", "remaining_time": "17:46:15"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "1:57:18", "remaining_time": "17:46:25"} +{"current_steps": 700, "total_steps": 7064, "loss": 0.8937, "reward": null, "learning_rate": 4.879830536701485e-05, "epoch": 0.2, "percentage": 9.91, "elapsed_time": "1:57:15", "remaining_time": "17:46:07"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8921, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "2:02:50", "remaining_time": "18:19:18"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8921, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "1:58:57", "remaining_time": "17:44:39"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8921, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "1:58:59", "remaining_time": "17:44:49"} +{"current_steps": 710, "total_steps": 7064, "loss": 0.8921, "reward": null, "learning_rate": 4.876401373936239e-05, "epoch": 0.2, "percentage": 10.05, "elapsed_time": "1:58:56", "remaining_time": "17:44:30"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.8801, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "2:04:32", "remaining_time": "18:17:19"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.8801, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "2:00:41", "remaining_time": "17:43:21"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.8801, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "2:00:39", "remaining_time": "17:43:12"} +{"current_steps": 720, "total_steps": 7064, "loss": 0.8801, "reward": null, "learning_rate": 4.8729252090513964e-05, "epoch": 0.2, "percentage": 10.19, "elapsed_time": "2:00:39", "remaining_time": "17:43:04"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8887, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "2:02:21", "remaining_time": "17:41:41"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8887, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "2:06:14", "remaining_time": "18:15:25"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8887, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "2:02:23", "remaining_time": "17:41:58"} +{"current_steps": 730, "total_steps": 7064, "loss": 0.8887, "reward": null, "learning_rate": 4.869402110800963e-05, "epoch": 0.21, "percentage": 10.33, "elapsed_time": "2:02:22", "remaining_time": "17:41:49"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8793, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "2:04:00", "remaining_time": "17:39:47"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8793, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "2:04:01", "remaining_time": "17:39:56"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8793, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "2:03:59", "remaining_time": "17:39:39"} +{"current_steps": 740, "total_steps": 7064, "loss": 0.8793, "reward": null, "learning_rate": 4.865832148867228e-05, "epoch": 0.21, "percentage": 10.48, "elapsed_time": "2:07:53", "remaining_time": "18:12:53"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.8811, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "2:09:35", "remaining_time": "18:11:00"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.8811, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "2:05:42", "remaining_time": "17:38:16"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.8811, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "2:05:43", "remaining_time": "17:38:24"} +{"current_steps": 750, "total_steps": 7064, "loss": 0.8811, "reward": null, "learning_rate": 4.8622153938593816e-05, "epoch": 0.21, "percentage": 10.62, "elapsed_time": "2:05:44", "remaining_time": "17:38:33"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8924, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:07:24", "remaining_time": "17:36:48"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8924, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:07:26", "remaining_time": "17:37:04"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8924, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:07:25", "remaining_time": "17:36:55"} +{"current_steps": 760, "total_steps": 7064, "loss": 0.8924, "reward": null, "learning_rate": 4.8585519173121205e-05, "epoch": 0.22, "percentage": 10.76, "elapsed_time": "2:11:17", "remaining_time": "18:09:03"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8988, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:12:55", "remaining_time": "18:06:33"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8988, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:09:04", "remaining_time": "17:35:02"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8988, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:09:03", "remaining_time": "17:34:53"} +{"current_steps": 770, "total_steps": 7064, "loss": 0.8988, "reward": null, "learning_rate": 4.8548417916842324e-05, "epoch": 0.22, "percentage": 10.9, "elapsed_time": "2:09:02", "remaining_time": "17:34:46"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:14:39", "remaining_time": "18:04:48"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:10:47", "remaining_time": "17:33:45"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:10:46", "remaining_time": "17:33:36"} +{"current_steps": 780, "total_steps": 7064, "loss": 0.8907, "reward": null, "learning_rate": 4.851085090357163e-05, "epoch": 0.22, "percentage": 11.04, "elapsed_time": "2:10:45", "remaining_time": "17:33:29"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8879, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:16:19", "remaining_time": "18:02:38"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8879, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:12:26", "remaining_time": "17:31:53"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8879, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:12:28", "remaining_time": "17:32:01"} +{"current_steps": 790, "total_steps": 7064, "loss": 0.8879, "reward": null, "learning_rate": 4.847281887633565e-05, "epoch": 0.22, "percentage": 11.18, "elapsed_time": "2:12:26", "remaining_time": "17:31:45"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:14:07", "remaining_time": "17:30:08"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:14:06", "remaining_time": "17:30:00"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:14:08", "remaining_time": "17:30:16"} +{"current_steps": 800, "total_steps": 7064, "loss": 0.8796, "reward": null, "learning_rate": 4.843432258735827e-05, "epoch": 0.23, "percentage": 11.33, "elapsed_time": "2:17:59", "remaining_time": "18:00:27"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8965, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:19:38", "remaining_time": "17:58:13"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8965, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:15:45", "remaining_time": "17:28:11"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8965, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:15:46", "remaining_time": "17:28:18"} +{"current_steps": 810, "total_steps": 7064, "loss": 0.8965, "reward": null, "learning_rate": 4.839536279804589e-05, "epoch": 0.23, "percentage": 11.47, "elapsed_time": "2:15:47", "remaining_time": "17:28:27"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:21:17", "remaining_time": "17:55:56"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:17:25", "remaining_time": "17:26:27"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:17:24", "remaining_time": "17:26:20"} +{"current_steps": 820, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.835594027897231e-05, "epoch": 0.23, "percentage": 11.61, "elapsed_time": "2:17:26", "remaining_time": "17:26:35"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8857, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:19:08", "remaining_time": "17:25:07"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8857, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:19:10", "remaining_time": "17:25:15"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8857, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:19:08", "remaining_time": "17:25:00"} +{"current_steps": 830, "total_steps": 7064, "loss": 0.8857, "reward": null, "learning_rate": 4.831605580986355e-05, "epoch": 0.23, "percentage": 11.75, "elapsed_time": "2:23:01", "remaining_time": "17:54:12"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:20:46", "remaining_time": "17:23:07"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:20:48", "remaining_time": "17:23:22"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:20:47", "remaining_time": "17:23:14"} +{"current_steps": 840, "total_steps": 7064, "loss": 0.8805, "reward": null, "learning_rate": 4.8275710179582366e-05, "epoch": 0.24, "percentage": 11.89, "elapsed_time": "2:24:40", "remaining_time": "17:51:55"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.865, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:22:30", "remaining_time": "17:21:48"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.865, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:22:31", "remaining_time": "17:21:56"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.865, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:22:29", "remaining_time": "17:21:41"} +{"current_steps": 850, "total_steps": 7064, "loss": 0.865, "reward": null, "learning_rate": 4.823490418611273e-05, "epoch": 0.24, "percentage": 12.03, "elapsed_time": "2:26:22", "remaining_time": "17:50:06"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8892, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:24:11", "remaining_time": "17:20:08"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8892, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:24:11", "remaining_time": "17:20:15"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8892, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:24:13", "remaining_time": "17:20:22"} +{"current_steps": 860, "total_steps": 7064, "loss": 0.8892, "reward": null, "learning_rate": 4.819363863654395e-05, "epoch": 0.24, "percentage": 12.17, "elapsed_time": "2:28:04", "remaining_time": "17:48:11"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8589, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:29:48", "remaining_time": "17:46:31"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8589, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:25:56", "remaining_time": "17:19:04"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8589, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:25:54", "remaining_time": "17:18:50"} +{"current_steps": 870, "total_steps": 7064, "loss": 0.8589, "reward": null, "learning_rate": 4.8151914347054776e-05, "epoch": 0.25, "percentage": 12.32, "elapsed_time": "2:25:55", "remaining_time": "17:18:56"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8819, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:27:34", "remaining_time": "17:17:02"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8819, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:27:36", "remaining_time": "17:17:16"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8819, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:27:35", "remaining_time": "17:17:09"} +{"current_steps": 880, "total_steps": 7064, "loss": 0.8819, "reward": null, "learning_rate": 4.810973214289724e-05, "epoch": 0.25, "percentage": 12.46, "elapsed_time": "2:31:27", "remaining_time": "17:44:22"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8778, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:33:09", "remaining_time": "17:42:29"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8778, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:29:16", "remaining_time": "17:15:31"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8778, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:29:17", "remaining_time": "17:15:37"} +{"current_steps": 890, "total_steps": 7064, "loss": 0.8778, "reward": null, "learning_rate": 4.806709285838031e-05, "epoch": 0.25, "percentage": 12.6, "elapsed_time": "2:29:18", "remaining_time": "17:15:45"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8725, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:34:52", "remaining_time": "17:40:41"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8725, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:30:58", "remaining_time": "17:14:03"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8725, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:31:00", "remaining_time": "17:14:17"} +{"current_steps": 900, "total_steps": 7064, "loss": 0.8725, "reward": null, "learning_rate": 4.8023997336853434e-05, "epoch": 0.25, "percentage": 12.74, "elapsed_time": "2:30:59", "remaining_time": "17:14:10"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8856, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:36:33", "remaining_time": "17:38:47"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8856, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:32:42", "remaining_time": "17:12:43"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8856, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:32:41", "remaining_time": "17:12:36"} +{"current_steps": 910, "total_steps": 7064, "loss": 0.8856, "reward": null, "learning_rate": 4.7980446430689804e-05, "epoch": 0.26, "percentage": 12.88, "elapsed_time": "2:32:40", "remaining_time": "17:12:29"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.8836, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:38:08", "remaining_time": "17:36:09"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.8836, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:34:17", "remaining_time": "17:10:24"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.8836, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:34:16", "remaining_time": "17:10:17"} +{"current_steps": 920, "total_steps": 7064, "loss": 0.8836, "reward": null, "learning_rate": 4.793644100126954e-05, "epoch": 0.26, "percentage": 13.02, "elapsed_time": "2:34:15", "remaining_time": "17:10:11"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8684, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:39:46", "remaining_time": "17:33:52"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8684, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:35:55", "remaining_time": "17:08:27"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8684, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:35:53", "remaining_time": "17:08:14"} +{"current_steps": 930, "total_steps": 7064, "loss": 0.8684, "reward": null, "learning_rate": 4.7891981918962656e-05, "epoch": 0.26, "percentage": 13.17, "elapsed_time": "2:35:54", "remaining_time": "17:08:20"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8671, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:41:26", "remaining_time": "17:31:47"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8671, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:37:35", "remaining_time": "17:06:40"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8671, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:37:34", "remaining_time": "17:06:33"} +{"current_steps": 940, "total_steps": 7064, "loss": 0.8671, "reward": null, "learning_rate": 4.784707006311179e-05, "epoch": 0.27, "percentage": 13.31, "elapsed_time": "2:37:33", "remaining_time": "17:06:27"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.868, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:43:07", "remaining_time": "17:29:50"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.868, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:39:14", "remaining_time": "17:04:48"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.868, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:39:15", "remaining_time": "17:04:54"} +{"current_steps": 950, "total_steps": 7064, "loss": 0.868, "reward": null, "learning_rate": 4.780170632201487e-05, "epoch": 0.27, "percentage": 13.45, "elapsed_time": "2:39:16", "remaining_time": "17:05:01"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8683, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:44:50", "remaining_time": "17:28:05"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8683, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:40:58", "remaining_time": "17:03:34"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8683, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:40:56", "remaining_time": "17:03:21"} +{"current_steps": 960, "total_steps": 7064, "loss": 0.8683, "reward": null, "learning_rate": 4.7755891592907556e-05, "epoch": 0.27, "percentage": 13.59, "elapsed_time": "2:40:57", "remaining_time": "17:03:27"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8581, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:46:28", "remaining_time": "17:25:51"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8581, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:42:35", "remaining_time": "17:01:31"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8581, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:42:35", "remaining_time": "17:01:25"} +{"current_steps": 970, "total_steps": 7064, "loss": 0.8581, "reward": null, "learning_rate": 4.7709626781945397e-05, "epoch": 0.27, "percentage": 13.73, "elapsed_time": "2:42:37", "remaining_time": "17:01:38"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8653, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:48:06", "remaining_time": "17:23:37"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8653, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:44:15", "remaining_time": "16:59:42"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8653, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:44:14", "remaining_time": "16:59:35"} +{"current_steps": 980, "total_steps": 7064, "loss": 0.8653, "reward": null, "learning_rate": 4.766291280418603e-05, "epoch": 0.28, "percentage": 13.87, "elapsed_time": "2:44:13", "remaining_time": "16:59:29"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:45:52", "remaining_time": "16:57:45"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:49:44", "remaining_time": "17:21:24"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:45:50", "remaining_time": "16:57:32"} +{"current_steps": 990, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.761575058357101e-05, "epoch": 0.28, "percentage": 14.01, "elapsed_time": "2:45:51", "remaining_time": "16:57:38"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8734, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:47:30", "remaining_time": "16:55:48"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8734, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:47:29", "remaining_time": "16:55:43"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8734, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:47:32", "remaining_time": "16:55:55"} +{"current_steps": 1000, "total_steps": 7064, "loss": 0.8734, "reward": null, "learning_rate": 4.756814105290753e-05, "epoch": 0.28, "percentage": 14.16, "elapsed_time": "2:51:23", "remaining_time": "17:19:17"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:53:04", "remaining_time": "17:17:22"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:49:11", "remaining_time": "16:54:09"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:49:10", "remaining_time": "16:54:04"} +{"current_steps": 1010, "total_steps": 7064, "loss": 0.8583, "reward": null, "learning_rate": 4.7520085153850014e-05, "epoch": 0.29, "percentage": 14.3, "elapsed_time": "2:49:12", "remaining_time": "16:54:16"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:54:43", "remaining_time": "17:15:21"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:50:50", "remaining_time": "16:52:19"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:50:52", "remaining_time": "16:52:31"} +{"current_steps": 1020, "total_steps": 7064, "loss": 0.874, "reward": null, "learning_rate": 4.7471583836881476e-05, "epoch": 0.29, "percentage": 14.44, "elapsed_time": "2:50:51", "remaining_time": "16:52:24"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:56:26", "remaining_time": "17:13:38"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:52:35", "remaining_time": "16:51:03"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:52:33", "remaining_time": "16:50:51"} +{"current_steps": 1030, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.742263806129469e-05, "epoch": 0.29, "percentage": 14.58, "elapsed_time": "2:52:34", "remaining_time": "16:50:57"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8807, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:54:16", "remaining_time": "16:49:27"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8807, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:54:15", "remaining_time": "16:49:21"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8807, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:54:14", "remaining_time": "16:49:15"} +{"current_steps": 1040, "total_steps": 7064, "loss": 0.8807, "reward": null, "learning_rate": 4.737324879517326e-05, "epoch": 0.29, "percentage": 14.72, "elapsed_time": "2:58:07", "remaining_time": "17:11:47"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:59:48", "remaining_time": "17:09:50"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:55:56", "remaining_time": "16:47:45"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:55:54", "remaining_time": "16:47:34"} +{"current_steps": 1050, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.732341701537245e-05, "epoch": 0.3, "percentage": 14.86, "elapsed_time": "2:55:55", "remaining_time": "16:47:39"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.875, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "3:01:29", "remaining_time": "17:08:00"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.875, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "2:57:38", "remaining_time": "16:46:10"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.875, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "2:57:36", "remaining_time": "16:45:58"} +{"current_steps": 1060, "total_steps": 7064, "loss": 0.875, "reward": null, "learning_rate": 4.727314370749988e-05, "epoch": 0.3, "percentage": 15.01, "elapsed_time": "2:57:37", "remaining_time": "16:46:03"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8709, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "2:59:17", "remaining_time": "16:44:22"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8709, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "3:03:09", "remaining_time": "17:06:04"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8709, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "2:59:18", "remaining_time": "16:44:28"} +{"current_steps": 1070, "total_steps": 7064, "loss": 0.8709, "reward": null, "learning_rate": 4.7222429865896e-05, "epoch": 0.3, "percentage": 15.15, "elapsed_time": "2:59:16", "remaining_time": "16:44:17"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "3:04:49", "remaining_time": "17:04:03"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "3:00:58", "remaining_time": "16:42:41"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "3:00:57", "remaining_time": "16:42:35"} +{"current_steps": 1080, "total_steps": 7064, "loss": 0.8634, "reward": null, "learning_rate": 4.717127649361444e-05, "epoch": 0.31, "percentage": 15.29, "elapsed_time": "3:00:56", "remaining_time": "16:42:30"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.8566, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "3:02:35", "remaining_time": "16:40:43"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.8566, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "3:06:28", "remaining_time": "17:02:02"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.8566, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "3:02:36", "remaining_time": "16:40:48"} +{"current_steps": 1090, "total_steps": 7064, "loss": 0.8566, "reward": null, "learning_rate": 4.71196846024022e-05, "epoch": 0.31, "percentage": 15.43, "elapsed_time": "3:02:37", "remaining_time": "16:40:54"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8667, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "3:08:08", "remaining_time": "17:00:04"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8667, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "3:04:15", "remaining_time": "16:38:59"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8667, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "3:04:17", "remaining_time": "16:39:10"} +{"current_steps": 1100, "total_steps": 7064, "loss": 0.8667, "reward": null, "learning_rate": 4.7067655212679585e-05, "epoch": 0.31, "percentage": 15.57, "elapsed_time": "3:04:16", "remaining_time": "16:39:04"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8688, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "3:05:59", "remaining_time": "16:37:41"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8688, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "3:05:57", "remaining_time": "16:37:30"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8688, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "3:05:58", "remaining_time": "16:37:35"} +{"current_steps": 1110, "total_steps": 7064, "loss": 0.8688, "reward": null, "learning_rate": 4.701518935352006e-05, "epoch": 0.31, "percentage": 15.71, "elapsed_time": "3:09:51", "remaining_time": "16:58:22"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8573, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "3:07:38", "remaining_time": "16:35:48"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8573, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "3:07:40", "remaining_time": "16:35:59"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8573, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "3:07:39", "remaining_time": "16:35:53"} +{"current_steps": 1120, "total_steps": 7064, "loss": 0.8573, "reward": null, "learning_rate": 4.69622880626299e-05, "epoch": 0.32, "percentage": 15.86, "elapsed_time": "3:11:31", "remaining_time": "16:56:26"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "3:09:20", "remaining_time": "16:34:15"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "3:09:19", "remaining_time": "16:34:10"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "3:09:21", "remaining_time": "16:34:21"} +{"current_steps": 1130, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.690895238632762e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "3:13:12", "remaining_time": "16:54:35"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:14:52", "remaining_time": "16:52:38"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:10:59", "remaining_time": "16:32:31"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:11:01", "remaining_time": "16:32:37"} +{"current_steps": 1140, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.685518337952335e-05, "epoch": 0.32, "percentage": 16.14, "elapsed_time": "3:10:58", "remaining_time": "16:32:26"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8656, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:16:30", "remaining_time": "16:50:34"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8656, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:12:38", "remaining_time": "16:30:38"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8656, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:12:39", "remaining_time": "16:30:44"} +{"current_steps": 1150, "total_steps": 7064, "loss": 0.8656, "reward": null, "learning_rate": 4.680098210569789e-05, "epoch": 0.33, "percentage": 16.28, "elapsed_time": "3:12:37", "remaining_time": "16:30:34"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8703, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:18:15", "remaining_time": "16:49:06"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8703, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:14:24", "remaining_time": "16:29:29"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8703, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:14:23", "remaining_time": "16:29:23"} +{"current_steps": 1160, "total_steps": 7064, "loss": 0.8703, "reward": null, "learning_rate": 4.674634963688177e-05, "epoch": 0.33, "percentage": 16.42, "elapsed_time": "3:14:22", "remaining_time": "16:29:18"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8616, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:16:06", "remaining_time": "16:27:53"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8616, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:16:07", "remaining_time": "16:27:59"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8616, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:16:05", "remaining_time": "16:27:49"} +{"current_steps": 1170, "total_steps": 7064, "loss": 0.8616, "reward": null, "learning_rate": 4.669128705363394e-05, "epoch": 0.33, "percentage": 16.56, "elapsed_time": "3:19:58", "remaining_time": "16:47:24"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:17:44", "remaining_time": "16:26:00"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:21:37", "remaining_time": "16:45:24"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:17:45", "remaining_time": "16:26:05"} +{"current_steps": 1180, "total_steps": 7064, "loss": 0.8677, "reward": null, "learning_rate": 4.663579544502049e-05, "epoch": 0.33, "percentage": 16.7, "elapsed_time": "3:17:46", "remaining_time": "16:26:10"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:23:18", "remaining_time": "16:43:33"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:19:25", "remaining_time": "16:24:21"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:19:27", "remaining_time": "16:24:31"} +{"current_steps": 1190, "total_steps": 7064, "loss": 0.8525, "reward": null, "learning_rate": 4.657987590859305e-05, "epoch": 0.34, "percentage": 16.85, "elapsed_time": "3:19:26", "remaining_time": "16:24:26"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8526, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:21:10", "remaining_time": "16:23:03"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8526, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:21:11", "remaining_time": "16:23:07"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8526, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:21:12", "remaining_time": "16:23:13"} +{"current_steps": 1200, "total_steps": 7064, "loss": 0.8526, "reward": null, "learning_rate": 4.652352955036713e-05, "epoch": 0.34, "percentage": 16.99, "elapsed_time": "3:25:03", "remaining_time": "16:42:03"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:26:43", "remaining_time": "16:40:09"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:22:51", "remaining_time": "16:21:25"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:22:52", "remaining_time": "16:21:30"} +{"current_steps": 1210, "total_steps": 7064, "loss": 0.8586, "reward": null, "learning_rate": 4.646675748480019e-05, "epoch": 0.34, "percentage": 17.13, "elapsed_time": "3:22:50", "remaining_time": "16:21:21"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:28:25", "remaining_time": "16:38:21"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:24:33", "remaining_time": "16:19:53"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:24:31", "remaining_time": "16:19:43"} +{"current_steps": 1220, "total_steps": 7064, "loss": 0.8542, "reward": null, "learning_rate": 4.640956083476964e-05, "epoch": 0.35, "percentage": 17.27, "elapsed_time": "3:24:32", "remaining_time": "16:19:48"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:30:07", "remaining_time": "16:36:38"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:26:15", "remaining_time": "16:18:16"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:26:16", "remaining_time": "16:18:21"} +{"current_steps": 1230, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.635194073155061e-05, "epoch": 0.35, "percentage": 17.41, "elapsed_time": "3:26:14", "remaining_time": "16:18:11"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:31:47", "remaining_time": "16:34:42"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:27:53", "remaining_time": "16:16:26"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:27:55", "remaining_time": "16:16:36"} +{"current_steps": 1240, "total_steps": 7064, "loss": 0.8592, "reward": null, "learning_rate": 4.62938983147936e-05, "epoch": 0.35, "percentage": 17.55, "elapsed_time": "3:27:54", "remaining_time": "16:16:31"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:33:27", "remaining_time": "16:32:52"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:29:35", "remaining_time": "16:14:51"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:29:36", "remaining_time": "16:14:56"} +{"current_steps": 1250, "total_steps": 7064, "loss": 0.8678, "reward": null, "learning_rate": 4.62354347325019e-05, "epoch": 0.35, "percentage": 17.7, "elapsed_time": "3:29:34", "remaining_time": "16:14:47"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8644, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:31:14", "remaining_time": "16:13:03"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8644, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:35:06", "remaining_time": "16:30:53"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8644, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:31:15", "remaining_time": "16:13:08"} +{"current_steps": 1260, "total_steps": 7064, "loss": 0.8644, "reward": null, "learning_rate": 4.6176551141008916e-05, "epoch": 0.36, "percentage": 17.84, "elapsed_time": "3:31:13", "remaining_time": "16:12:58"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:36:48", "remaining_time": "16:29:08"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:32:56", "remaining_time": "16:11:28"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:32:55", "remaining_time": "16:11:23"} +{"current_steps": 1270, "total_steps": 7064, "loss": 0.8541, "reward": null, "learning_rate": 4.611724870495528e-05, "epoch": 0.36, "percentage": 17.98, "elapsed_time": "3:32:57", "remaining_time": "16:11:33"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8438, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:38:28", "remaining_time": "16:27:12"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8438, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:34:34", "remaining_time": "16:09:38"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8438, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:34:35", "remaining_time": "16:09:42"} +{"current_steps": 1280, "total_steps": 7064, "loss": 0.8438, "reward": null, "learning_rate": 4.605752859726583e-05, "epoch": 0.36, "percentage": 18.12, "elapsed_time": "3:34:36", "remaining_time": "16:09:47"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:36:15", "remaining_time": "16:07:58"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:40:08", "remaining_time": "16:25:18"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:36:14", "remaining_time": "16:07:54"} +{"current_steps": 1290, "total_steps": 7064, "loss": 0.8604, "reward": null, "learning_rate": 4.5997391999126397e-05, "epoch": 0.37, "percentage": 18.26, "elapsed_time": "3:36:16", "remaining_time": "16:08:03"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:41:48", "remaining_time": "16:23:26"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:37:56", "remaining_time": "16:06:21"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:37:55", "remaining_time": "16:06:16"} +{"current_steps": 1300, "total_steps": 7064, "loss": 0.8633, "reward": null, "learning_rate": 4.5936840099960465e-05, "epoch": 0.37, "percentage": 18.4, "elapsed_time": "3:37:54", "remaining_time": "16:06:12"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.8437, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:43:28", "remaining_time": "16:21:34"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.8437, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:39:37", "remaining_time": "16:04:39"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.8437, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:39:35", "remaining_time": "16:04:30"} +{"current_steps": 1310, "total_steps": 7064, "loss": 0.8437, "reward": null, "learning_rate": 4.587587409740561e-05, "epoch": 0.37, "percentage": 18.54, "elapsed_time": "3:39:36", "remaining_time": "16:04:34"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8466, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:41:14", "remaining_time": "16:02:46"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8466, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:41:14", "remaining_time": "16:02:42"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8466, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:41:16", "remaining_time": "16:02:50"} +{"current_steps": 1320, "total_steps": 7064, "loss": 0.8466, "reward": null, "learning_rate": 4.581449519728986e-05, "epoch": 0.37, "percentage": 18.69, "elapsed_time": "3:45:07", "remaining_time": "16:19:37"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8457, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:46:47", "remaining_time": "16:17:46"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8457, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:42:56", "remaining_time": "16:01:09"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8457, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:42:54", "remaining_time": "16:01:00"} +{"current_steps": 1330, "total_steps": 7064, "loss": 0.8457, "reward": null, "learning_rate": 4.575270461360779e-05, "epoch": 0.38, "percentage": 18.83, "elapsed_time": "3:42:55", "remaining_time": "16:01:04"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.8477, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:48:28", "remaining_time": "16:15:57"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.8477, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:44:37", "remaining_time": "15:59:29"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.8477, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:44:35", "remaining_time": "15:59:24"} +{"current_steps": 1340, "total_steps": 7064, "loss": 0.8477, "reward": null, "learning_rate": 4.569050356849655e-05, "epoch": 0.38, "percentage": 18.97, "elapsed_time": "3:44:35", "remaining_time": "15:59:20"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8608, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:50:09", "remaining_time": "16:14:09"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8608, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:46:17", "remaining_time": "15:57:50"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8608, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:46:15", "remaining_time": "15:57:41"} +{"current_steps": 1350, "total_steps": 7064, "loss": 0.8608, "reward": null, "learning_rate": 4.562789329221169e-05, "epoch": 0.38, "percentage": 19.11, "elapsed_time": "3:46:16", "remaining_time": "15:57:45"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8555, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:51:48", "remaining_time": "16:12:14"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8555, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:47:55", "remaining_time": "15:55:55"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8555, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:47:56", "remaining_time": "15:55:59"} +{"current_steps": 1360, "total_steps": 7064, "loss": 0.8555, "reward": null, "learning_rate": 4.5564875023102796e-05, "epoch": 0.39, "percentage": 19.25, "elapsed_time": "3:47:57", "remaining_time": "15:56:04"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:53:30", "remaining_time": "16:10:29"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:49:36", "remaining_time": "15:54:19"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:49:37", "remaining_time": "15:54:23"} +{"current_steps": 1370, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.550145000758905e-05, "epoch": 0.39, "percentage": 19.39, "elapsed_time": "3:49:38", "remaining_time": "15:54:28"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8613, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:55:10", "remaining_time": "16:08:36"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8613, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:51:17", "remaining_time": "15:52:39"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8613, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:51:16", "remaining_time": "15:52:35"} +{"current_steps": 1380, "total_steps": 7064, "loss": 0.8613, "reward": null, "learning_rate": 4.543761950013453e-05, "epoch": 0.39, "percentage": 19.54, "elapsed_time": "3:51:18", "remaining_time": "15:52:44"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:56:51", "remaining_time": "16:06:50"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:52:57", "remaining_time": "15:50:58"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:52:58", "remaining_time": "15:51:01"} +{"current_steps": 1390, "total_steps": 7064, "loss": 0.849, "reward": null, "learning_rate": 4.537338476322341e-05, "epoch": 0.39, "percentage": 19.68, "elapsed_time": "3:52:59", "remaining_time": "15:51:06"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.858, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:58:30", "remaining_time": "16:04:57"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.858, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:54:39", "remaining_time": "15:49:21"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.858, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:54:38", "remaining_time": "15:49:17"} +{"current_steps": 1400, "total_steps": 7064, "loss": 0.858, "reward": null, "learning_rate": 4.530874706733502e-05, "epoch": 0.4, "percentage": 19.82, "elapsed_time": "3:54:37", "remaining_time": "15:49:13"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8468, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "4:00:10", "remaining_time": "16:03:04"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8468, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "3:56:18", "remaining_time": "15:47:32"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8468, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "3:56:19", "remaining_time": "15:47:37"} +{"current_steps": 1410, "total_steps": 7064, "loss": 0.8468, "reward": null, "learning_rate": 4.524370769091866e-05, "epoch": 0.4, "percentage": 19.96, "elapsed_time": "3:56:17", "remaining_time": "15:47:29"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "4:01:50", "remaining_time": "16:01:12"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "3:57:58", "remaining_time": "15:45:53"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "3:57:57", "remaining_time": "15:45:48"} +{"current_steps": 1420, "total_steps": 7064, "loss": 0.8624, "reward": null, "learning_rate": 4.5178267920368366e-05, "epoch": 0.4, "percentage": 20.1, "elapsed_time": "3:57:56", "remaining_time": "15:45:45"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.8464, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "4:03:28", "remaining_time": "15:59:16"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.8464, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "3:59:37", "remaining_time": "15:44:04"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.8464, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "3:59:36", "remaining_time": "15:44:00"} +{"current_steps": 1430, "total_steps": 7064, "loss": 0.8464, "reward": null, "learning_rate": 4.511242904999746e-05, "epoch": 0.4, "percentage": 20.24, "elapsed_time": "3:59:35", "remaining_time": "15:43:57"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8575, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "4:05:10", "remaining_time": "15:57:31"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8575, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "4:01:17", "remaining_time": "15:42:24"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8575, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "4:01:16", "remaining_time": "15:42:20"} +{"current_steps": 1440, "total_steps": 7064, "loss": 0.8575, "reward": null, "learning_rate": 4.50461923820129e-05, "epoch": 0.41, "percentage": 20.39, "elapsed_time": "4:01:18", "remaining_time": "15:42:28"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8587, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "4:06:53", "remaining_time": "15:55:52"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8587, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "4:03:00", "remaining_time": "15:40:53"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8587, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "4:03:01", "remaining_time": "15:40:57"} +{"current_steps": 1450, "total_steps": 7064, "loss": 0.8587, "reward": null, "learning_rate": 4.497955922648961e-05, "epoch": 0.41, "percentage": 20.53, "elapsed_time": "4:02:59", "remaining_time": "15:40:49"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "4:08:34", "remaining_time": "15:54:05"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "4:04:40", "remaining_time": "15:39:09"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "4:04:42", "remaining_time": "15:39:17"} +{"current_steps": 1460, "total_steps": 7064, "loss": 0.8517, "reward": null, "learning_rate": 4.491253090134447e-05, "epoch": 0.41, "percentage": 20.67, "elapsed_time": "4:04:41", "remaining_time": "15:39:13"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8427, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "4:10:15", "remaining_time": "15:52:21"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8427, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "4:06:24", "remaining_time": "15:37:41"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8427, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "4:06:23", "remaining_time": "15:37:37"} +{"current_steps": 1470, "total_steps": 7064, "loss": 0.8427, "reward": null, "learning_rate": 4.4845108732310355e-05, "epoch": 0.42, "percentage": 20.81, "elapsed_time": "4:06:22", "remaining_time": "15:37:33"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8588, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "4:08:08", "remaining_time": "15:36:12"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8588, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "4:08:06", "remaining_time": "15:36:04"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8588, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "4:08:07", "remaining_time": "15:36:08"} +{"current_steps": 1480, "total_steps": 7064, "loss": 0.8588, "reward": null, "learning_rate": 4.4777294052909804e-05, "epoch": 0.42, "percentage": 20.95, "elapsed_time": "4:11:59", "remaining_time": "15:50:45"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "4:13:37", "remaining_time": "15:48:46"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "4:09:43", "remaining_time": "15:34:13"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "4:09:45", "remaining_time": "15:34:21"} +{"current_steps": 1490, "total_steps": 7064, "loss": 0.8516, "reward": null, "learning_rate": 4.470908820442873e-05, "epoch": 0.42, "percentage": 21.09, "elapsed_time": "4:09:44", "remaining_time": "15:34:16"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8408, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "4:11:24", "remaining_time": "15:32:33"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8408, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "4:11:23", "remaining_time": "15:32:29"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8408, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "4:11:22", "remaining_time": "15:32:26"} +{"current_steps": 1500, "total_steps": 7064, "loss": 0.8408, "reward": null, "learning_rate": 4.464049253588985e-05, "epoch": 0.42, "percentage": 21.23, "elapsed_time": "4:15:15", "remaining_time": "15:46:51"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8513, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:13:05", "remaining_time": "15:30:54"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8513, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:16:57", "remaining_time": "15:45:09"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8513, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:13:06", "remaining_time": "15:30:58"} +{"current_steps": 1510, "total_steps": 7064, "loss": 0.8513, "reward": null, "learning_rate": 4.457150840402604e-05, "epoch": 0.43, "percentage": 21.38, "elapsed_time": "4:13:04", "remaining_time": "15:30:51"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:18:38", "remaining_time": "15:43:21"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:14:47", "remaining_time": "15:29:17"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:14:46", "remaining_time": "15:29:13"} +{"current_steps": 1520, "total_steps": 7064, "loss": 0.8554, "reward": null, "learning_rate": 4.450213717325343e-05, "epoch": 0.43, "percentage": 21.52, "elapsed_time": "4:14:45", "remaining_time": "15:29:10"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8598, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:20:19", "remaining_time": "15:41:35"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8598, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:16:27", "remaining_time": "15:27:34"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8598, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:16:28", "remaining_time": "15:27:38"} +{"current_steps": 1530, "total_steps": 7064, "loss": 0.8598, "reward": null, "learning_rate": 4.443238021564448e-05, "epoch": 0.43, "percentage": 21.66, "elapsed_time": "4:16:26", "remaining_time": "15:27:31"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8495, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:21:58", "remaining_time": "15:39:41"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8495, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:18:05", "remaining_time": "15:25:48"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8495, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:18:05", "remaining_time": "15:25:44"} +{"current_steps": 1540, "total_steps": 7064, "loss": 0.8495, "reward": null, "learning_rate": 4.4362238910900835e-05, "epoch": 0.44, "percentage": 21.8, "elapsed_time": "4:18:07", "remaining_time": "15:25:52"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8338, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:23:38", "remaining_time": "15:37:52"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8338, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:19:46", "remaining_time": "15:24:09"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8338, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:19:45", "remaining_time": "15:24:05"} +{"current_steps": 1550, "total_steps": 7064, "loss": 0.8338, "reward": null, "learning_rate": 4.4291714646326024e-05, "epoch": 0.44, "percentage": 21.94, "elapsed_time": "4:19:44", "remaining_time": "15:24:02"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:25:21", "remaining_time": "15:36:14"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:21:28", "remaining_time": "15:22:31"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:21:29", "remaining_time": "15:22:34"} +{"current_steps": 1560, "total_steps": 7064, "loss": 0.8576, "reward": null, "learning_rate": 4.4220808816797995e-05, "epoch": 0.44, "percentage": 22.08, "elapsed_time": "4:21:30", "remaining_time": "15:22:38"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:27:02", "remaining_time": "15:34:27"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:23:09", "remaining_time": "15:20:54"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:23:08", "remaining_time": "15:20:51"} +{"current_steps": 1570, "total_steps": 7064, "loss": 0.8593, "reward": null, "learning_rate": 4.414952282474158e-05, "epoch": 0.44, "percentage": 22.23, "elapsed_time": "4:23:10", "remaining_time": "15:20:58"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.8534, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:24:51", "remaining_time": "15:19:17"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.8534, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:24:50", "remaining_time": "15:19:13"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.8534, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:24:49", "remaining_time": "15:19:10"} +{"current_steps": 1580, "total_steps": 7064, "loss": 0.8534, "reward": null, "learning_rate": 4.407785808010073e-05, "epoch": 0.45, "percentage": 22.37, "elapsed_time": "4:28:42", "remaining_time": "15:32:40"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8564, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:30:23", "remaining_time": "15:30:52"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8564, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:26:31", "remaining_time": "15:17:36"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8564, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:26:30", "remaining_time": "15:17:32"} +{"current_steps": 1590, "total_steps": 7064, "loss": 0.8564, "reward": null, "learning_rate": 4.400581600031062e-05, "epoch": 0.45, "percentage": 22.51, "elapsed_time": "4:26:29", "remaining_time": "15:17:29"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:32:03", "remaining_time": "15:29:06"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:28:12", "remaining_time": "15:15:56"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:28:11", "remaining_time": "15:15:52"} +{"current_steps": 1600, "total_steps": 7064, "loss": 0.8446, "reward": null, "learning_rate": 4.3933398010269614e-05, "epoch": 0.45, "percentage": 22.65, "elapsed_time": "4:28:10", "remaining_time": "15:15:49"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8445, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:33:44", "remaining_time": "15:27:19"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8445, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:29:51", "remaining_time": "15:14:09"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8445, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:29:52", "remaining_time": "15:14:12"} +{"current_steps": 1610, "total_steps": 7064, "loss": 0.8445, "reward": null, "learning_rate": 4.386060554231111e-05, "epoch": 0.46, "percentage": 22.79, "elapsed_time": "4:29:53", "remaining_time": "15:14:16"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8281, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:31:36", "remaining_time": "15:12:44"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8281, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:31:38", "remaining_time": "15:12:51"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8281, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:31:37", "remaining_time": "15:12:47"} +{"current_steps": 1620, "total_steps": 7064, "loss": 0.8281, "reward": null, "learning_rate": 4.378744003617517e-05, "epoch": 0.46, "percentage": 22.93, "elapsed_time": "4:35:29", "remaining_time": "15:25:48"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8449, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:33:19", "remaining_time": "15:11:12"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8449, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:33:21", "remaining_time": "15:11:19"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8449, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:33:20", "remaining_time": "15:11:15"} +{"current_steps": 1630, "total_steps": 7064, "loss": 0.8449, "reward": null, "learning_rate": 4.371390293898007e-05, "epoch": 0.46, "percentage": 23.07, "elapsed_time": "4:37:13", "remaining_time": "15:24:10"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8405, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:38:53", "remaining_time": "15:22:24"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8405, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:35:02", "remaining_time": "15:09:39"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8405, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:35:01", "remaining_time": "15:09:36"} +{"current_steps": 1640, "total_steps": 7064, "loss": 0.8405, "reward": null, "learning_rate": 4.3639995705193684e-05, "epoch": 0.46, "percentage": 23.22, "elapsed_time": "4:35:00", "remaining_time": "15:09:32"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8349, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:36:40", "remaining_time": "15:07:51"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8349, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:36:42", "remaining_time": "15:07:54"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8349, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:36:40", "remaining_time": "15:07:48"} +{"current_steps": 1650, "total_steps": 7064, "loss": 0.8349, "reward": null, "learning_rate": 4.3565719796604706e-05, "epoch": 0.47, "percentage": 23.36, "elapsed_time": "4:40:33", "remaining_time": "15:20:33"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:42:15", "remaining_time": "15:18:51"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:38:22", "remaining_time": "15:06:14"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:38:21", "remaining_time": "15:06:11"} +{"current_steps": 1660, "total_steps": 7064, "loss": 0.8311, "reward": null, "learning_rate": 4.3491076682293715e-05, "epoch": 0.47, "percentage": 23.5, "elapsed_time": "4:38:23", "remaining_time": "15:06:18"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8383, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:43:55", "remaining_time": "15:17:02"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8383, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:40:03", "remaining_time": "15:04:35"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8383, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:40:02", "remaining_time": "15:04:31"} +{"current_steps": 1670, "total_steps": 7064, "loss": 0.8383, "reward": null, "learning_rate": 4.341606783860416e-05, "epoch": 0.47, "percentage": 23.64, "elapsed_time": "4:40:01", "remaining_time": "15:04:28"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8313, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:45:34", "remaining_time": "15:15:12"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8313, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:41:42", "remaining_time": "15:02:48"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8313, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:41:41", "remaining_time": "15:02:45"} +{"current_steps": 1680, "total_steps": 7064, "loss": 0.8313, "reward": null, "learning_rate": 4.334069474911313e-05, "epoch": 0.48, "percentage": 23.78, "elapsed_time": "4:41:43", "remaining_time": "15:02:51"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:47:14", "remaining_time": "15:13:22"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:43:22", "remaining_time": "15:01:06"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:43:21", "remaining_time": "15:01:03"} +{"current_steps": 1690, "total_steps": 7064, "loss": 0.8424, "reward": null, "learning_rate": 4.326495890460204e-05, "epoch": 0.48, "percentage": 23.92, "elapsed_time": "4:43:20", "remaining_time": "15:01:00"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8323, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:45:00", "remaining_time": "14:59:17"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8323, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:45:01", "remaining_time": "14:59:20"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8323, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:44:59", "remaining_time": "14:59:14"} +{"current_steps": 1700, "total_steps": 7064, "loss": 0.8323, "reward": null, "learning_rate": 4.3188861803027094e-05, "epoch": 0.48, "percentage": 24.07, "elapsed_time": "4:48:52", "remaining_time": "15:11:30"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:46:40", "remaining_time": "14:57:33"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:46:41", "remaining_time": "14:57:37"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:46:39", "remaining_time": "14:57:30"} +{"current_steps": 1710, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.3112404949489715e-05, "epoch": 0.48, "percentage": 24.21, "elapsed_time": "4:50:32", "remaining_time": "15:09:41"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:52:12", "remaining_time": "15:07:53"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:48:20", "remaining_time": "14:55:51"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:48:21", "remaining_time": "14:55:54"} +{"current_steps": 1720, "total_steps": 7064, "loss": 0.8399, "reward": null, "learning_rate": 4.303558985620673e-05, "epoch": 0.49, "percentage": 24.35, "elapsed_time": "4:48:19", "remaining_time": "14:55:48"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:53:49", "remaining_time": "15:05:57"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:49:58", "remaining_time": "14:54:04"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:49:57", "remaining_time": "14:54:00"} +{"current_steps": 1730, "total_steps": 7064, "loss": 0.8184, "reward": null, "learning_rate": 4.2958418042480506e-05, "epoch": 0.49, "percentage": 24.49, "elapsed_time": "4:49:56", "remaining_time": "14:53:57"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.8418, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:55:30", "remaining_time": "15:04:12"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.8418, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:51:39", "remaining_time": "14:52:25"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.8418, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:51:37", "remaining_time": "14:52:18"} +{"current_steps": 1740, "total_steps": 7064, "loss": 0.8418, "reward": null, "learning_rate": 4.288089103466886e-05, "epoch": 0.49, "percentage": 24.63, "elapsed_time": "4:51:38", "remaining_time": "14:52:21"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.828, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:57:09", "remaining_time": "15:02:19"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.828, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:53:17", "remaining_time": "14:50:37"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.828, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:53:16", "remaining_time": "14:50:33"} +{"current_steps": 1750, "total_steps": 7064, "loss": 0.828, "reward": null, "learning_rate": 4.280301036615489e-05, "epoch": 0.5, "percentage": 24.77, "elapsed_time": "4:53:15", "remaining_time": "14:50:30"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.836, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:54:55", "remaining_time": "14:48:47"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.836, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:54:54", "remaining_time": "14:48:45"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.836, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:54:56", "remaining_time": "14:48:51"} +{"current_steps": 1760, "total_steps": 7064, "loss": 0.836, "reward": null, "learning_rate": 4.272477757731662e-05, "epoch": 0.5, "percentage": 24.92, "elapsed_time": "4:58:47", "remaining_time": "15:00:28"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "5:00:27", "remaining_time": "14:58:39"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "4:56:34", "remaining_time": "14:47:01"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "4:56:35", "remaining_time": "14:47:04"} +{"current_steps": 1770, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 4.2646194215496595e-05, "epoch": 0.5, "percentage": 25.06, "elapsed_time": "4:56:36", "remaining_time": "14:47:07"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8357, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "4:58:15", "remaining_time": "14:45:22"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8357, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "5:02:06", "remaining_time": "14:56:48"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8357, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "4:58:13", "remaining_time": "14:45:16"} +{"current_steps": 1780, "total_steps": 7064, "loss": 0.8357, "reward": null, "learning_rate": 4.2567261834971206e-05, "epoch": 0.5, "percentage": 25.2, "elapsed_time": "4:58:13", "remaining_time": "14:45:18"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8498, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "5:03:47", "remaining_time": "14:55:03"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8498, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "4:59:55", "remaining_time": "14:43:42"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8498, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "4:59:53", "remaining_time": "14:43:36"} +{"current_steps": 1790, "total_steps": 7064, "loss": 0.8498, "reward": null, "learning_rate": 4.248798199691998e-05, "epoch": 0.51, "percentage": 25.34, "elapsed_time": "4:59:54", "remaining_time": "14:43:38"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8361, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "5:01:36", "remaining_time": "14:42:03"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8361, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "5:01:35", "remaining_time": "14:42:00"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8361, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "5:01:34", "remaining_time": "14:41:57"} +{"current_steps": 1800, "total_steps": 7064, "loss": 0.8361, "reward": null, "learning_rate": 4.2408356269394714e-05, "epoch": 0.51, "percentage": 25.48, "elapsed_time": "5:05:28", "remaining_time": "14:53:19"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8237, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "5:07:09", "remaining_time": "14:51:35"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8237, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "5:03:17", "remaining_time": "14:40:23"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8237, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "5:03:16", "remaining_time": "14:40:20"} +{"current_steps": 1810, "total_steps": 7064, "loss": 0.8237, "reward": null, "learning_rate": 4.2328386227288445e-05, "epoch": 0.51, "percentage": 25.62, "elapsed_time": "5:03:15", "remaining_time": "14:40:18"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8413, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "5:08:50", "remaining_time": "14:49:51"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8413, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "5:04:58", "remaining_time": "14:38:45"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8413, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "5:04:57", "remaining_time": "14:38:41"} +{"current_steps": 1820, "total_steps": 7064, "loss": 0.8413, "reward": null, "learning_rate": 4.224807345230429e-05, "epoch": 0.52, "percentage": 25.76, "elapsed_time": "5:04:56", "remaining_time": "14:38:39"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "5:10:32", "remaining_time": "14:48:12"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "5:06:41", "remaining_time": "14:37:10"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "5:06:39", "remaining_time": "14:37:04"} +{"current_steps": 1830, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 4.21674195329242e-05, "epoch": 0.52, "percentage": 25.91, "elapsed_time": "5:06:40", "remaining_time": "14:37:07"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "5:12:14", "remaining_time": "14:46:30"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "5:08:23", "remaining_time": "14:35:33"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "5:08:21", "remaining_time": "14:35:27"} +{"current_steps": 1840, "total_steps": 7064, "loss": 0.8501, "reward": null, "learning_rate": 4.208642606437748e-05, "epoch": 0.52, "percentage": 26.05, "elapsed_time": "5:08:22", "remaining_time": "14:35:30"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.8372, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "5:13:57", "remaining_time": "14:44:51"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.8372, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "5:10:06", "remaining_time": "14:33:59"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.8372, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "5:10:04", "remaining_time": "14:33:54"} +{"current_steps": 1850, "total_steps": 7064, "loss": 0.8372, "reward": null, "learning_rate": 4.2005094648609325e-05, "epoch": 0.52, "percentage": 26.19, "elapsed_time": "5:10:05", "remaining_time": "14:33:56"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8072, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "5:11:48", "remaining_time": "14:32:24"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8072, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "5:11:47", "remaining_time": "14:32:21"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8072, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "5:11:46", "remaining_time": "14:32:18"} +{"current_steps": 1860, "total_steps": 7064, "loss": 0.8072, "reward": null, "learning_rate": 4.192342689424903e-05, "epoch": 0.53, "percentage": 26.33, "elapsed_time": "5:15:39", "remaining_time": "14:43:11"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8409, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "5:17:20", "remaining_time": "14:41:25"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8409, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "5:13:28", "remaining_time": "14:30:40"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8409, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "5:13:27", "remaining_time": "14:30:37"} +{"current_steps": 1870, "total_steps": 7064, "loss": 0.8409, "reward": null, "learning_rate": 4.184142441657827e-05, "epoch": 0.53, "percentage": 26.47, "elapsed_time": "5:13:29", "remaining_time": "14:30:43"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.856, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:19:02", "remaining_time": "14:39:43"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.856, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:15:10", "remaining_time": "14:29:05"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.856, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:15:09", "remaining_time": "14:29:02"} +{"current_steps": 1880, "total_steps": 7064, "loss": 0.856, "reward": null, "learning_rate": 4.1759088837499095e-05, "epoch": 0.53, "percentage": 26.61, "elapsed_time": "5:15:08", "remaining_time": "14:29:00"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8428, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:20:42", "remaining_time": "14:37:58"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8428, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:16:51", "remaining_time": "14:27:24"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8428, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:16:50", "remaining_time": "14:27:21"} +{"current_steps": 1890, "total_steps": 7064, "loss": 0.8428, "reward": null, "learning_rate": 4.167642178550186e-05, "epoch": 0.54, "percentage": 26.76, "elapsed_time": "5:16:49", "remaining_time": "14:27:19"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:22:24", "remaining_time": "14:36:16"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:18:32", "remaining_time": "14:25:44"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:18:31", "remaining_time": "14:25:42"} +{"current_steps": 1900, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.159342489563304e-05, "epoch": 0.54, "percentage": 26.9, "elapsed_time": "5:18:33", "remaining_time": "14:25:47"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:24:01", "remaining_time": "14:34:21"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:20:09", "remaining_time": "14:23:54"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:20:10", "remaining_time": "14:23:57"} +{"current_steps": 1910, "total_steps": 7064, "loss": 0.8317, "reward": null, "learning_rate": 4.151009980946287e-05, "epoch": 0.54, "percentage": 27.04, "elapsed_time": "5:20:08", "remaining_time": "14:23:52"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.8172, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:25:46", "remaining_time": "14:32:47"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.8172, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:21:54", "remaining_time": "14:22:27"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.8172, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:21:53", "remaining_time": "14:22:24"} +{"current_steps": 1920, "total_steps": 7064, "loss": 0.8172, "reward": null, "learning_rate": 4.142644817505284e-05, "epoch": 0.54, "percentage": 27.18, "elapsed_time": "5:21:52", "remaining_time": "14:22:22"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:27:26", "remaining_time": "14:31:00"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:23:34", "remaining_time": "14:20:45"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:23:32", "remaining_time": "14:20:40"} +{"current_steps": 1930, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.1342471646923196e-05, "epoch": 0.55, "percentage": 27.32, "elapsed_time": "5:23:33", "remaining_time": "14:20:42"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8303, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:29:04", "remaining_time": "14:29:10"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8303, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:25:12", "remaining_time": "14:18:57"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8303, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:25:13", "remaining_time": "14:19:00"} +{"current_steps": 1940, "total_steps": 7064, "loss": 0.8303, "reward": null, "learning_rate": 4.1258171886020124e-05, "epoch": 0.55, "percentage": 27.46, "elapsed_time": "5:25:11", "remaining_time": "14:18:54"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8292, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:30:45", "remaining_time": "14:27:25"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8292, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:26:52", "remaining_time": "14:17:13"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8292, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:26:53", "remaining_time": "14:17:16"} +{"current_steps": 1950, "total_steps": 7064, "loss": 0.8292, "reward": null, "learning_rate": 4.117355055968295e-05, "epoch": 0.55, "percentage": 27.6, "elapsed_time": "5:26:54", "remaining_time": "14:17:19"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:32:28", "remaining_time": "14:25:46"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:28:34", "remaining_time": "14:15:39"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:28:35", "remaining_time": "14:15:41"} +{"current_steps": 1960, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 4.1088609341611135e-05, "epoch": 0.55, "percentage": 27.75, "elapsed_time": "5:28:36", "remaining_time": "14:15:44"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:34:09", "remaining_time": "14:24:02"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:30:15", "remaining_time": "14:13:59"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:30:16", "remaining_time": "14:14:01"} +{"current_steps": 1970, "total_steps": 7064, "loss": 0.8344, "reward": null, "learning_rate": 4.1003349911831166e-05, "epoch": 0.56, "percentage": 27.89, "elapsed_time": "5:30:17", "remaining_time": "14:14:04"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:35:53", "remaining_time": "14:22:26"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:32:00", "remaining_time": "14:12:29"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:32:01", "remaining_time": "14:12:32"} +{"current_steps": 1980, "total_steps": 7064, "loss": 0.8545, "reward": null, "learning_rate": 4.091777395666338e-05, "epoch": 0.56, "percentage": 28.03, "elapsed_time": "5:31:59", "remaining_time": "14:12:27"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:33:43", "remaining_time": "14:10:54"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:33:42", "remaining_time": "14:10:51"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:33:41", "remaining_time": "14:10:49"} +{"current_steps": 1990, "total_steps": 7064, "loss": 0.8305, "reward": null, "learning_rate": 4.0831883168688534e-05, "epoch": 0.56, "percentage": 28.17, "elapsed_time": "5:37:34", "remaining_time": "14:20:43"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:39:18", "remaining_time": "14:19:08"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:35:27", "remaining_time": "14:09:22"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:35:25", "remaining_time": "14:09:17"} +{"current_steps": 2000, "total_steps": 7064, "loss": 0.8365, "reward": null, "learning_rate": 4.07456792467144e-05, "epoch": 0.57, "percentage": 28.31, "elapsed_time": "5:35:26", "remaining_time": "14:09:19"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8375, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:37:08", "remaining_time": "14:07:42"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8375, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:41:00", "remaining_time": "14:17:27"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8375, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:37:09", "remaining_time": "14:07:45"} +{"current_steps": 2010, "total_steps": 7064, "loss": 0.8375, "reward": null, "learning_rate": 4.065916389574211e-05, "epoch": 0.57, "percentage": 28.45, "elapsed_time": "5:37:07", "remaining_time": "14:07:40"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8351, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:42:42", "remaining_time": "14:15:46"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8351, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:38:51", "remaining_time": "14:06:08"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8351, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:38:50", "remaining_time": "14:06:05"} +{"current_steps": 2020, "total_steps": 7064, "loss": 0.8351, "reward": null, "learning_rate": 4.057233882693246e-05, "epoch": 0.57, "percentage": 28.6, "elapsed_time": "5:38:49", "remaining_time": "14:06:03"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8165, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:40:36", "remaining_time": "14:04:38"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8165, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:40:34", "remaining_time": "14:04:33"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8165, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:40:35", "remaining_time": "14:04:36"} +{"current_steps": 2030, "total_steps": 7064, "loss": 0.8165, "reward": null, "learning_rate": 4.048520575757207e-05, "epoch": 0.57, "percentage": 28.74, "elapsed_time": "5:44:27", "remaining_time": "14:14:12"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:46:07", "remaining_time": "14:12:25"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:42:14", "remaining_time": "14:02:51"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:42:15", "remaining_time": "14:02:53"} +{"current_steps": 2040, "total_steps": 7064, "loss": 0.8194, "reward": null, "learning_rate": 4.0397766411039395e-05, "epoch": 0.58, "percentage": 28.88, "elapsed_time": "5:42:16", "remaining_time": "14:02:56"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8218, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:43:53", "remaining_time": "14:01:07"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8218, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:43:52", "remaining_time": "14:01:04"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8218, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:43:51", "remaining_time": "14:01:02"} +{"current_steps": 2050, "total_steps": 7064, "loss": 0.8218, "reward": null, "learning_rate": 4.031002251677067e-05, "epoch": 0.58, "percentage": 29.02, "elapsed_time": "5:47:45", "remaining_time": "14:10:33"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:49:29", "remaining_time": "14:08:58"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:45:37", "remaining_time": "13:59:34"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:45:36", "remaining_time": "13:59:31"} +{"current_steps": 2060, "total_steps": 7064, "loss": 0.8203, "reward": null, "learning_rate": 4.022197581022567e-05, "epoch": 0.58, "percentage": 29.16, "elapsed_time": "5:45:38", "remaining_time": "13:59:36"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:51:09", "remaining_time": "14:07:10"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:47:15", "remaining_time": "13:57:47"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:47:17", "remaining_time": "13:57:52"} +{"current_steps": 2070, "total_steps": 7064, "loss": 0.832, "reward": null, "learning_rate": 4.0133628032853435e-05, "epoch": 0.59, "percentage": 29.3, "elapsed_time": "5:47:16", "remaining_time": "13:57:50"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:52:49", "remaining_time": "14:05:25"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:48:58", "remaining_time": "13:56:11"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:48:56", "remaining_time": "13:56:06"} +{"current_steps": 2080, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 4.004498093205773e-05, "epoch": 0.59, "percentage": 29.45, "elapsed_time": "5:48:57", "remaining_time": "13:56:08"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8421, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:54:29", "remaining_time": "14:03:39"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8421, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:50:38", "remaining_time": "13:54:29"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8421, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:50:36", "remaining_time": "13:54:24"} +{"current_steps": 2090, "total_steps": 7064, "loss": 0.8421, "reward": null, "learning_rate": 3.99560362611626e-05, "epoch": 0.59, "percentage": 29.59, "elapsed_time": "5:50:37", "remaining_time": "13:54:26"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8217, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:56:13", "remaining_time": "14:02:03"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8217, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:52:21", "remaining_time": "13:52:54"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8217, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:52:20", "remaining_time": "13:52:51"} +{"current_steps": 2100, "total_steps": 7064, "loss": 0.8217, "reward": null, "learning_rate": 3.986679577937762e-05, "epoch": 0.59, "percentage": 29.73, "elapsed_time": "5:52:22", "remaining_time": "13:52:56"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:58:00", "remaining_time": "14:00:34"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:54:09", "remaining_time": "13:51:31"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:54:07", "remaining_time": "13:51:26"} +{"current_steps": 2110, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.9777261251763145e-05, "epoch": 0.6, "percentage": 29.87, "elapsed_time": "5:54:08", "remaining_time": "13:51:28"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8321, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:55:50", "remaining_time": "13:49:51"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8321, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:55:51", "remaining_time": "13:49:53"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8321, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:55:49", "remaining_time": "13:49:49"} +{"current_steps": 2120, "total_steps": 7064, "loss": 0.8321, "reward": null, "learning_rate": 3.9687434449195316e-05, "epoch": 0.6, "percentage": 30.01, "elapsed_time": "5:59:43", "remaining_time": "13:58:53"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8266, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "6:01:28", "remaining_time": "13:57:18"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8266, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "5:57:36", "remaining_time": "13:48:23"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8266, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "5:57:35", "remaining_time": "13:48:20"} +{"current_steps": 2130, "total_steps": 7064, "loss": 0.8266, "reward": null, "learning_rate": 3.959731714833115e-05, "epoch": 0.6, "percentage": 30.15, "elapsed_time": "5:57:34", "remaining_time": "13:48:18"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.82, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "6:03:09", "remaining_time": "13:55:35"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.82, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "5:59:16", "remaining_time": "13:46:41"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.82, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "5:59:17", "remaining_time": "13:46:43"} +{"current_steps": 2140, "total_steps": 7064, "loss": 0.82, "reward": null, "learning_rate": 3.95069111315733e-05, "epoch": 0.61, "percentage": 30.29, "elapsed_time": "5:59:15", "remaining_time": "13:46:38"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8347, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "6:00:58", "remaining_time": "13:45:02"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8347, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "6:00:57", "remaining_time": "13:45:00"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8347, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "6:00:56", "remaining_time": "13:44:58"} +{"current_steps": 2150, "total_steps": 7064, "loss": 0.8347, "reward": null, "learning_rate": 3.9416218187034876e-05, "epoch": 0.61, "percentage": 30.44, "elapsed_time": "6:04:49", "remaining_time": "13:53:51"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8472, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "6:06:36", "remaining_time": "13:52:20"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8472, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "6:02:44", "remaining_time": "13:43:33"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8472, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "6:02:43", "remaining_time": "13:43:30"} +{"current_steps": 2160, "total_steps": 7064, "loss": 0.8472, "reward": null, "learning_rate": 3.9325240108504016e-05, "epoch": 0.61, "percentage": 30.58, "elapsed_time": "6:02:45", "remaining_time": "13:43:35"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8092, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "6:04:22", "remaining_time": "13:41:46"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8092, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "6:04:23", "remaining_time": "13:41:49"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8092, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "6:04:21", "remaining_time": "13:41:44"} +{"current_steps": 2170, "total_steps": 7064, "loss": 0.8092, "reward": null, "learning_rate": 3.923397869540845e-05, "epoch": 0.61, "percentage": 30.72, "elapsed_time": "6:08:15", "remaining_time": "13:50:30"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8166, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "6:05:59", "remaining_time": "13:39:57"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8166, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "6:09:51", "remaining_time": "13:48:37"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8166, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "6:05:58", "remaining_time": "13:39:55"} +{"current_steps": 2180, "total_steps": 7064, "loss": 0.8166, "reward": null, "learning_rate": 3.91424357527799e-05, "epoch": 0.62, "percentage": 30.86, "elapsed_time": "6:06:00", "remaining_time": "13:39:59"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "6:07:40", "remaining_time": "13:38:16"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "6:07:38", "remaining_time": "13:38:12"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "6:07:39", "remaining_time": "13:38:14"} +{"current_steps": 2190, "total_steps": 7064, "loss": 0.817, "reward": null, "learning_rate": 3.905061309121837e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "6:11:31", "remaining_time": "13:46:51"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "6:09:21", "remaining_time": "13:36:38"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "6:13:15", "remaining_time": "13:45:13"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "6:09:22", "remaining_time": "13:36:40"} +{"current_steps": 2200, "total_steps": 7064, "loss": 0.8073, "reward": null, "learning_rate": 3.895851252685634e-05, "epoch": 0.62, "percentage": 31.14, "elapsed_time": "6:09:23", "remaining_time": "13:36:42"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "6:11:03", "remaining_time": "13:34:58"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "6:11:05", "remaining_time": "13:35:03"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "6:11:04", "remaining_time": "13:35:00"} +{"current_steps": 2210, "total_steps": 7064, "loss": 0.8355, "reward": null, "learning_rate": 3.886613588132284e-05, "epoch": 0.63, "percentage": 31.29, "elapsed_time": "6:14:56", "remaining_time": "13:43:31"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8232, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "6:16:42", "remaining_time": "13:41:59"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8232, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "6:12:51", "remaining_time": "13:33:34"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8232, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "6:12:50", "remaining_time": "13:33:32"} +{"current_steps": 2220, "total_steps": 7064, "loss": 0.8232, "reward": null, "learning_rate": 3.877348498170743e-05, "epoch": 0.63, "percentage": 31.43, "elapsed_time": "6:12:49", "remaining_time": "13:33:30"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8312, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "6:18:27", "remaining_time": "13:40:23"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8312, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "6:14:36", "remaining_time": "13:32:01"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8312, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "6:14:34", "remaining_time": "13:31:57"} +{"current_steps": 2230, "total_steps": 7064, "loss": 0.8312, "reward": null, "learning_rate": 3.868056166052407e-05, "epoch": 0.63, "percentage": 31.57, "elapsed_time": "6:14:35", "remaining_time": "13:31:59"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "6:20:07", "remaining_time": "13:38:37"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "6:16:14", "remaining_time": "13:30:16"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "6:16:15", "remaining_time": "13:30:18"} +{"current_steps": 2240, "total_steps": 7064, "loss": 0.8215, "reward": null, "learning_rate": 3.858736775567484e-05, "epoch": 0.63, "percentage": 31.71, "elapsed_time": "6:16:13", "remaining_time": "13:30:14"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:21:50", "remaining_time": "13:36:59"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:17:57", "remaining_time": "13:28:40"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:17:58", "remaining_time": "13:28:42"} +{"current_steps": 2250, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.8493905110413626e-05, "epoch": 0.64, "percentage": 31.85, "elapsed_time": "6:17:59", "remaining_time": "13:28:44"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8282, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:23:34", "remaining_time": "13:35:21"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8282, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:19:42", "remaining_time": "13:27:07"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8282, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:19:41", "remaining_time": "13:27:05"} +{"current_steps": 2260, "total_steps": 7064, "loss": 0.8282, "reward": null, "learning_rate": 3.8400175573309646e-05, "epoch": 0.64, "percentage": 31.99, "elapsed_time": "6:19:43", "remaining_time": "13:27:09"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8337, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:25:13", "remaining_time": "13:33:34"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8337, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:21:22", "remaining_time": "13:25:25"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8337, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:21:21", "remaining_time": "13:25:23"} +{"current_steps": 2270, "total_steps": 7064, "loss": 0.8337, "reward": null, "learning_rate": 3.83061809982109e-05, "epoch": 0.64, "percentage": 32.13, "elapsed_time": "6:21:20", "remaining_time": "13:25:21"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8291, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:26:57", "remaining_time": "13:31:56"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8291, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:23:05", "remaining_time": "13:23:49"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8291, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:23:04", "remaining_time": "13:23:47"} +{"current_steps": 2280, "total_steps": 7064, "loss": 0.8291, "reward": null, "learning_rate": 3.821192324420747e-05, "epoch": 0.65, "percentage": 32.28, "elapsed_time": "6:23:06", "remaining_time": "13:23:51"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8444, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:24:49", "remaining_time": "13:22:14"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8444, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:24:47", "remaining_time": "13:22:10"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8444, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:24:48", "remaining_time": "13:22:12"} +{"current_steps": 2290, "total_steps": 7064, "loss": 0.8444, "reward": null, "learning_rate": 3.8117404175594795e-05, "epoch": 0.65, "percentage": 32.42, "elapsed_time": "6:28:40", "remaining_time": "13:30:16"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:30:20", "remaining_time": "13:28:30"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:26:29", "remaining_time": "13:20:31"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:26:27", "remaining_time": "13:20:27"} +{"current_steps": 2300, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 3.8022625661836775e-05, "epoch": 0.65, "percentage": 32.56, "elapsed_time": "6:26:28", "remaining_time": "13:20:29"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:32:04", "remaining_time": "13:26:53"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:28:12", "remaining_time": "13:18:55"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:28:11", "remaining_time": "13:18:53"} +{"current_steps": 2310, "total_steps": 7064, "loss": 0.825, "reward": null, "learning_rate": 3.792758957752879e-05, "epoch": 0.65, "percentage": 32.7, "elapsed_time": "6:28:13", "remaining_time": "13:18:57"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8244, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:29:53", "remaining_time": "13:17:16"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8244, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:33:47", "remaining_time": "13:25:13"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8244, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:29:55", "remaining_time": "13:17:20"} +{"current_steps": 2320, "total_steps": 7064, "loss": 0.8244, "reward": null, "learning_rate": 3.783229780236062e-05, "epoch": 0.66, "percentage": 32.84, "elapsed_time": "6:29:54", "remaining_time": "13:17:18"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:35:30", "remaining_time": "13:23:34"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:31:39", "remaining_time": "13:15:44"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:31:38", "remaining_time": "13:15:42"} +{"current_steps": 2330, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 3.773675222107929e-05, "epoch": 0.66, "percentage": 32.98, "elapsed_time": "6:31:37", "remaining_time": "13:15:40"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:37:12", "remaining_time": "13:21:53"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:33:19", "remaining_time": "13:14:02"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:33:20", "remaining_time": "13:14:04"} +{"current_steps": 2340, "total_steps": 7064, "loss": 0.823, "reward": null, "learning_rate": 3.7640954723451784e-05, "epoch": 0.66, "percentage": 33.13, "elapsed_time": "6:33:21", "remaining_time": "13:14:06"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8177, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:38:51", "remaining_time": "13:20:06"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8177, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:34:59", "remaining_time": "13:12:20"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8177, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:35:00", "remaining_time": "13:12:22"} +{"current_steps": 2350, "total_steps": 7064, "loss": 0.8177, "reward": null, "learning_rate": 3.7544907204227646e-05, "epoch": 0.67, "percentage": 33.27, "elapsed_time": "6:34:58", "remaining_time": "13:12:18"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:40:33", "remaining_time": "13:18:24"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:36:41", "remaining_time": "13:10:41"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:36:40", "remaining_time": "13:10:39"} +{"current_steps": 2360, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.7448611563101536e-05, "epoch": 0.67, "percentage": 33.41, "elapsed_time": "6:36:42", "remaining_time": "13:10:43"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8236, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:42:16", "remaining_time": "13:16:44"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8236, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:38:23", "remaining_time": "13:09:02"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8236, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:38:24", "remaining_time": "13:09:04"} +{"current_steps": 2370, "total_steps": 7064, "loss": 0.8236, "reward": null, "learning_rate": 3.735206970467564e-05, "epoch": 0.67, "percentage": 33.55, "elapsed_time": "6:38:25", "remaining_time": "13:09:06"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:43:59", "remaining_time": "13:15:04"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:40:06", "remaining_time": "13:07:25"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:40:08", "remaining_time": "13:07:29"} +{"current_steps": 2380, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 3.7255283538421984e-05, "epoch": 0.67, "percentage": 33.69, "elapsed_time": "6:40:07", "remaining_time": "13:07:27"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.8143, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:45:40", "remaining_time": "13:13:20"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.8143, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:41:47", "remaining_time": "13:05:46"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.8143, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:41:46", "remaining_time": "13:05:44"} +{"current_steps": 2390, "total_steps": 7064, "loss": 0.8143, "reward": null, "learning_rate": 3.7158254978644703e-05, "epoch": 0.68, "percentage": 33.83, "elapsed_time": "6:41:48", "remaining_time": "13:05:48"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:47:21", "remaining_time": "13:11:37"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:43:28", "remaining_time": "13:04:04"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:43:29", "remaining_time": "13:04:06"} +{"current_steps": 2400, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 3.706098594444216e-05, "epoch": 0.68, "percentage": 33.98, "elapsed_time": "6:43:30", "remaining_time": "13:04:08"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8253, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:45:12", "remaining_time": "13:02:31"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8253, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:49:05", "remaining_time": "13:10:00"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8253, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:45:14", "remaining_time": "13:02:33"} +{"current_steps": 2410, "total_steps": 7064, "loss": 0.8253, "reward": null, "learning_rate": 3.6963478359668966e-05, "epoch": 0.68, "percentage": 34.12, "elapsed_time": "6:45:12", "remaining_time": "13:02:29"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:50:47", "remaining_time": "13:08:18"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:46:55", "remaining_time": "13:00:54"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:46:53", "remaining_time": "13:00:50"} +{"current_steps": 2420, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.6865734152897987e-05, "epoch": 0.69, "percentage": 34.26, "elapsed_time": "6:46:54", "remaining_time": "13:00:52"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:48:40", "remaining_time": "12:59:20"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:48:38", "remaining_time": "12:59:16"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:48:39", "remaining_time": "12:59:18"} +{"current_steps": 2430, "total_steps": 7064, "loss": 0.8263, "reward": null, "learning_rate": 3.676775525738213e-05, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "6:52:31", "remaining_time": "13:06:41"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:50:25", "remaining_time": "12:57:46"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:50:24", "remaining_time": "12:57:44"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:50:23", "remaining_time": "12:57:43"} +{"current_steps": 2440, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 3.666954361101616e-05, "epoch": 0.69, "percentage": 34.54, "elapsed_time": "6:54:16", "remaining_time": "13:05:05"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8089, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:52:07", "remaining_time": "12:56:09"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8089, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:52:06", "remaining_time": "12:56:07"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8089, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:52:05", "remaining_time": "12:56:05"} +{"current_steps": 2450, "total_steps": 7064, "loss": 0.8089, "reward": null, "learning_rate": 3.657110115629832e-05, "epoch": 0.69, "percentage": 34.68, "elapsed_time": "6:55:59", "remaining_time": "13:03:24"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:57:40", "remaining_time": "13:01:41"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:53:46", "remaining_time": "12:54:24"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:53:47", "remaining_time": "12:54:26"} +{"current_steps": 2460, "total_steps": 7064, "loss": 0.8155, "reward": null, "learning_rate": 3.647242984029201e-05, "epoch": 0.7, "percentage": 34.82, "elapsed_time": "6:53:48", "remaining_time": "12:54:28"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:59:18", "remaining_time": "12:59:52"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:55:27", "remaining_time": "12:52:42"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:55:25", "remaining_time": "12:52:38"} +{"current_steps": 2470, "total_steps": 7064, "loss": 0.8142, "reward": null, "learning_rate": 3.637353161458713e-05, "epoch": 0.7, "percentage": 34.97, "elapsed_time": "6:55:26", "remaining_time": "12:52:40"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "7:01:04", "remaining_time": "12:58:18"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "6:57:12", "remaining_time": "12:51:10"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "6:57:11", "remaining_time": "12:51:08"} +{"current_steps": 2480, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.627440843526158e-05, "epoch": 0.7, "percentage": 35.11, "elapsed_time": "6:57:10", "remaining_time": "12:51:06"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8134, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "6:58:54", "remaining_time": "12:49:30"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8134, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "6:58:52", "remaining_time": "12:49:26"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8134, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "6:58:53", "remaining_time": "12:49:28"} +{"current_steps": 2490, "total_steps": 7064, "loss": 0.8134, "reward": null, "learning_rate": 3.6175062262842585e-05, "epoch": 0.7, "percentage": 35.25, "elapsed_time": "7:02:45", "remaining_time": "12:56:35"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "7:00:31", "remaining_time": "12:47:43"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "7:00:32", "remaining_time": "12:47:45"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "7:00:30", "remaining_time": "12:47:41"} +{"current_steps": 2500, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.607549506226784e-05, "epoch": 0.71, "percentage": 35.39, "elapsed_time": "7:04:24", "remaining_time": "12:54:47"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "7:06:08", "remaining_time": "12:53:09"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "7:02:14", "remaining_time": "12:46:05"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "7:02:16", "remaining_time": "12:46:09"} +{"current_steps": 2510, "total_steps": 7064, "loss": 0.8192, "reward": null, "learning_rate": 3.5975708802846725e-05, "epoch": 0.71, "percentage": 35.53, "elapsed_time": "7:02:15", "remaining_time": "12:46:07"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "7:07:50", "remaining_time": "12:51:27"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "7:03:58", "remaining_time": "12:44:30"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "7:03:56", "remaining_time": "12:44:26"} +{"current_steps": 2520, "total_steps": 7064, "loss": 0.8348, "reward": null, "learning_rate": 3.587570545822128e-05, "epoch": 0.71, "percentage": 35.67, "elapsed_time": "7:03:57", "remaining_time": "12:44:28"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "7:09:29", "remaining_time": "12:49:41"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "7:05:38", "remaining_time": "12:42:46"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "7:05:36", "remaining_time": "12:42:44"} +{"current_steps": 2530, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.5775487006327215e-05, "epoch": 0.72, "percentage": 35.82, "elapsed_time": "7:05:36", "remaining_time": "12:42:42"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "7:11:09", "remaining_time": "12:47:55"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "7:07:16", "remaining_time": "12:41:01"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "7:07:15", "remaining_time": "12:41:00"} +{"current_steps": 2540, "total_steps": 7064, "loss": 0.8235, "reward": null, "learning_rate": 3.567505542935482e-05, "epoch": 0.72, "percentage": 35.96, "elapsed_time": "7:07:17", "remaining_time": "12:41:03"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "7:12:49", "remaining_time": "12:46:10"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "7:08:57", "remaining_time": "12:39:21"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "7:08:56", "remaining_time": "12:39:19"} +{"current_steps": 2550, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 3.557441271370968e-05, "epoch": 0.72, "percentage": 36.1, "elapsed_time": "7:08:55", "remaining_time": "12:39:17"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8197, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "7:14:34", "remaining_time": "12:44:34"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8197, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "7:10:41", "remaining_time": "12:37:44"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8197, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "7:10:43", "remaining_time": "12:37:47"} +{"current_steps": 2560, "total_steps": 7064, "loss": 0.8197, "reward": null, "learning_rate": 3.547356084997344e-05, "epoch": 0.72, "percentage": 36.24, "elapsed_time": "7:10:41", "remaining_time": "12:37:45"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "7:16:17", "remaining_time": "12:42:54"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "7:12:24", "remaining_time": "12:36:07"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "7:12:23", "remaining_time": "12:36:06"} +{"current_steps": 2570, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.537250183286443e-05, "epoch": 0.73, "percentage": 36.38, "elapsed_time": "7:12:25", "remaining_time": "12:36:09"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8154, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "7:17:59", "remaining_time": "12:41:12"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8154, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "7:14:05", "remaining_time": "12:34:27"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8154, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "7:14:06", "remaining_time": "12:34:29"} +{"current_steps": 2580, "total_steps": 7064, "loss": 0.8154, "reward": null, "learning_rate": 3.527123766119818e-05, "epoch": 0.73, "percentage": 36.52, "elapsed_time": "7:14:07", "remaining_time": "12:34:30"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "7:15:47", "remaining_time": "12:32:48"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "7:15:45", "remaining_time": "12:32:44"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "7:15:46", "remaining_time": "12:32:46"} +{"current_steps": 2590, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.5169770337847935e-05, "epoch": 0.73, "percentage": 36.66, "elapsed_time": "7:19:39", "remaining_time": "12:39:27"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8318, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "7:21:20", "remaining_time": "12:37:45"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8318, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "7:17:28", "remaining_time": "12:31:06"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8318, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "7:17:29", "remaining_time": "12:31:08"} +{"current_steps": 2600, "total_steps": 7064, "loss": 0.8318, "reward": null, "learning_rate": 3.5068101869705004e-05, "epoch": 0.74, "percentage": 36.81, "elapsed_time": "7:17:27", "remaining_time": "12:31:04"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8146, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "7:23:02", "remaining_time": "12:36:04"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8146, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "7:19:11", "remaining_time": "12:29:29"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8146, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "7:19:10", "remaining_time": "12:29:27"} +{"current_steps": 2610, "total_steps": 7064, "loss": 0.8146, "reward": null, "learning_rate": 3.496623426763908e-05, "epoch": 0.74, "percentage": 36.95, "elapsed_time": "7:19:09", "remaining_time": "12:29:26"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:20:54", "remaining_time": "12:27:51"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:20:55", "remaining_time": "12:27:53"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:20:53", "remaining_time": "12:27:49"} +{"current_steps": 2620, "total_steps": 7064, "loss": 0.8097, "reward": null, "learning_rate": 3.486416954645846e-05, "epoch": 0.74, "percentage": 37.09, "elapsed_time": "7:24:46", "remaining_time": "12:34:25"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8176, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:26:31", "remaining_time": "12:32:49"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8176, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:22:39", "remaining_time": "12:26:17"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8176, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:22:38", "remaining_time": "12:26:16"} +{"current_steps": 2630, "total_steps": 7064, "loss": 0.8176, "reward": null, "learning_rate": 3.4761909724870205e-05, "epoch": 0.74, "percentage": 37.23, "elapsed_time": "7:22:40", "remaining_time": "12:26:19"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8284, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:28:10", "remaining_time": "12:31:02"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8284, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:24:19", "remaining_time": "12:24:34"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8284, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:24:17", "remaining_time": "12:24:31"} +{"current_steps": 2640, "total_steps": 7064, "loss": 0.8284, "reward": null, "learning_rate": 3.4659456825440216e-05, "epoch": 0.75, "percentage": 37.37, "elapsed_time": "7:24:18", "remaining_time": "12:24:33"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:29:53", "remaining_time": "12:29:22"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:26:01", "remaining_time": "12:22:55"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:26:02", "remaining_time": "12:22:56"} +{"current_steps": 2650, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.4556812874553204e-05, "epoch": 0.75, "percentage": 37.51, "elapsed_time": "7:26:00", "remaining_time": "12:22:53"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:27:38", "remaining_time": "12:21:08"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:27:41", "remaining_time": "12:21:12"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:27:39", "remaining_time": "12:21:10"} +{"current_steps": 2660, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.445397990237264e-05, "epoch": 0.75, "percentage": 37.66, "elapsed_time": "7:31:32", "remaining_time": "12:27:35"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:33:12", "remaining_time": "12:25:51"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:29:21", "remaining_time": "12:19:30"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:29:19", "remaining_time": "12:19:27"} +{"current_steps": 2670, "total_steps": 7064, "loss": 0.8013, "reward": null, "learning_rate": 3.4350959942800584e-05, "epoch": 0.76, "percentage": 37.8, "elapsed_time": "7:29:20", "remaining_time": "12:19:28"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8196, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:31:00", "remaining_time": "12:17:45"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8196, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:30:58", "remaining_time": "12:17:42"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8196, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:30:58", "remaining_time": "12:17:43"} +{"current_steps": 2680, "total_steps": 7064, "loss": 0.8196, "reward": null, "learning_rate": 3.424775503343747e-05, "epoch": 0.76, "percentage": 37.94, "elapsed_time": "7:34:51", "remaining_time": "12:24:03"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:36:32", "remaining_time": "12:22:20"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:32:39", "remaining_time": "12:16:02"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:32:38", "remaining_time": "12:16:00"} +{"current_steps": 2690, "total_steps": 7064, "loss": 0.802, "reward": null, "learning_rate": 3.414436721554179e-05, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "7:32:40", "remaining_time": "12:16:04"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:38:15", "remaining_time": "12:20:40"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:34:23", "remaining_time": "12:14:25"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:34:22", "remaining_time": "12:14:23"} +{"current_steps": 2700, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.4040798533989745e-05, "epoch": 0.76, "percentage": 38.22, "elapsed_time": "7:34:24", "remaining_time": "12:14:27"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8055, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:39:58", "remaining_time": "12:19:01"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8055, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:36:07", "remaining_time": "12:12:49"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8055, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:36:06", "remaining_time": "12:12:47"} +{"current_steps": 2710, "total_steps": 7064, "loss": 0.8055, "reward": null, "learning_rate": 3.3937051037234745e-05, "epoch": 0.77, "percentage": 38.36, "elapsed_time": "7:36:05", "remaining_time": "12:12:46"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:41:40", "remaining_time": "12:17:19"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:37:49", "remaining_time": "12:11:09"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:37:47", "remaining_time": "12:11:07"} +{"current_steps": 2720, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.3833126777266974e-05, "epoch": 0.77, "percentage": 38.51, "elapsed_time": "7:37:47", "remaining_time": "12:11:06"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8222, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:43:23", "remaining_time": "12:15:39"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8222, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:39:32", "remaining_time": "12:09:32"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8222, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:39:30", "remaining_time": "12:09:29"} +{"current_steps": 2730, "total_steps": 7064, "loss": 0.8222, "reward": null, "learning_rate": 3.3729027809572735e-05, "epoch": 0.77, "percentage": 38.65, "elapsed_time": "7:39:31", "remaining_time": "12:09:30"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:45:03", "remaining_time": "12:13:55"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:41:12", "remaining_time": "12:07:50"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:41:11", "remaining_time": "12:07:48"} +{"current_steps": 2740, "total_steps": 7064, "loss": 0.8104, "reward": null, "learning_rate": 3.3624756193093835e-05, "epoch": 0.78, "percentage": 38.79, "elapsed_time": "7:41:10", "remaining_time": "12:07:46"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:42:53", "remaining_time": "12:06:09"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:42:54", "remaining_time": "12:06:11"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:42:52", "remaining_time": "12:06:07"} +{"current_steps": 2750, "total_steps": 7064, "loss": 0.8147, "reward": null, "learning_rate": 3.3520313990186856e-05, "epoch": 0.78, "percentage": 38.93, "elapsed_time": "7:46:46", "remaining_time": "12:12:13"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:48:23", "remaining_time": "12:10:25"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:44:32", "remaining_time": "12:04:25"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:44:31", "remaining_time": "12:04:23"} +{"current_steps": 2760, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 3.341570326658232e-05, "epoch": 0.78, "percentage": 39.07, "elapsed_time": "7:44:30", "remaining_time": "12:04:21"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:50:07", "remaining_time": "12:08:47"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:46:15", "remaining_time": "12:02:46"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:46:16", "remaining_time": "12:02:48"} +{"current_steps": 2770, "total_steps": 7064, "loss": 0.8059, "reward": null, "learning_rate": 3.331092609134392e-05, "epoch": 0.78, "percentage": 39.21, "elapsed_time": "7:46:14", "remaining_time": "12:02:45"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:51:50", "remaining_time": "12:07:07"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:47:58", "remaining_time": "12:01:09"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:47:57", "remaining_time": "12:01:07"} +{"current_steps": 2780, "total_steps": 7064, "loss": 0.8204, "reward": null, "learning_rate": 3.32059845368275e-05, "epoch": 0.79, "percentage": 39.35, "elapsed_time": "7:47:59", "remaining_time": "12:01:10"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:53:33", "remaining_time": "12:05:27"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:49:42", "remaining_time": "11:59:33"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:49:40", "remaining_time": "11:59:29"} +{"current_steps": 2790, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.310088067864015e-05, "epoch": 0.79, "percentage": 39.5, "elapsed_time": "7:49:41", "remaining_time": "11:59:31"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:55:15", "remaining_time": "12:03:45"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:51:24", "remaining_time": "11:57:52"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:51:22", "remaining_time": "11:57:49"} +{"current_steps": 2800, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.299561659559909e-05, "epoch": 0.79, "percentage": 39.64, "elapsed_time": "7:51:23", "remaining_time": "11:57:51"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:53:06", "remaining_time": "11:56:14"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:53:05", "remaining_time": "11:56:12"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:53:04", "remaining_time": "11:56:11"} +{"current_steps": 2810, "total_steps": 7064, "loss": 0.8038, "reward": null, "learning_rate": 3.289019436969057e-05, "epoch": 0.8, "percentage": 39.78, "elapsed_time": "7:56:58", "remaining_time": "12:02:04"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:54:49", "remaining_time": "11:54:35"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:58:41", "remaining_time": "12:00:24"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:54:48", "remaining_time": "11:54:33"} +{"current_steps": 2820, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 3.278461608602873e-05, "epoch": 0.8, "percentage": 39.92, "elapsed_time": "7:54:50", "remaining_time": "11:54:36"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8182, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "8:00:22", "remaining_time": "11:58:41"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8182, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "7:56:29", "remaining_time": "11:52:52"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8182, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "7:56:30", "remaining_time": "11:52:54"} +{"current_steps": 2830, "total_steps": 7064, "loss": 0.8182, "reward": null, "learning_rate": 3.267888383281431e-05, "epoch": 0.8, "percentage": 40.06, "elapsed_time": "7:56:31", "remaining_time": "11:52:55"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "7:58:13", "remaining_time": "11:51:16"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "7:58:12", "remaining_time": "11:51:15"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "7:58:11", "remaining_time": "11:51:13"} +{"current_steps": 2840, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 3.257299970129336e-05, "epoch": 0.8, "percentage": 40.2, "elapsed_time": "8:02:05", "remaining_time": "11:57:00"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.809, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "7:59:55", "remaining_time": "11:49:36"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.809, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "7:59:53", "remaining_time": "11:49:34"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.809, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "7:59:53", "remaining_time": "11:49:33"} +{"current_steps": 2850, "total_steps": 7064, "loss": 0.809, "reward": null, "learning_rate": 3.246696578571592e-05, "epoch": 0.81, "percentage": 40.35, "elapsed_time": "8:03:46", "remaining_time": "11:55:18"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8288, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "8:01:39", "remaining_time": "11:48:00"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8288, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "8:01:38", "remaining_time": "11:47:58"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8288, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "8:01:37", "remaining_time": "11:47:57"} +{"current_steps": 2860, "total_steps": 7064, "loss": 0.8288, "reward": null, "learning_rate": 3.236078418329452e-05, "epoch": 0.81, "percentage": 40.49, "elapsed_time": "8:05:30", "remaining_time": "11:53:40"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "8:07:15", "remaining_time": "11:52:02"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "8:03:24", "remaining_time": "11:46:24"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "8:03:23", "remaining_time": "11:46:23"} +{"current_steps": 2870, "total_steps": 7064, "loss": 0.808, "reward": null, "learning_rate": 3.225445699416276e-05, "epoch": 0.81, "percentage": 40.63, "elapsed_time": "8:03:22", "remaining_time": "11:46:22"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "8:05:06", "remaining_time": "11:44:45"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "8:08:57", "remaining_time": "11:50:21"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "8:05:04", "remaining_time": "11:44:42"} +{"current_steps": 2880, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 3.214798632133376e-05, "epoch": 0.82, "percentage": 40.77, "elapsed_time": "8:05:05", "remaining_time": "11:44:43"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "8:10:44", "remaining_time": "11:48:45"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "8:06:52", "remaining_time": "11:43:11"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "8:06:50", "remaining_time": "11:43:08"} +{"current_steps": 2890, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 3.204137427065857e-05, "epoch": 0.82, "percentage": 40.91, "elapsed_time": "8:06:51", "remaining_time": "11:43:10"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.819, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "8:12:29", "remaining_time": "11:47:08"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.819, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "8:08:37", "remaining_time": "11:41:35"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.819, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "8:08:38", "remaining_time": "11:41:36"} +{"current_steps": 2900, "total_steps": 7064, "loss": 0.819, "reward": null, "learning_rate": 3.193462295078448e-05, "epoch": 0.82, "percentage": 41.05, "elapsed_time": "8:08:36", "remaining_time": "11:41:33"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8108, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "8:10:20", "remaining_time": "11:39:58"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8108, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "8:10:19", "remaining_time": "11:39:56"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8108, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "8:10:18", "remaining_time": "11:39:55"} +{"current_steps": 2910, "total_steps": 7064, "loss": 0.8108, "reward": null, "learning_rate": 3.1827734473113356e-05, "epoch": 0.82, "percentage": 41.19, "elapsed_time": "8:14:12", "remaining_time": "11:45:28"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "8:12:00", "remaining_time": "11:38:15"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "8:15:53", "remaining_time": "11:43:46"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "8:12:01", "remaining_time": "11:38:16"} +{"current_steps": 2920, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 3.172071095175989e-05, "epoch": 0.83, "percentage": 41.34, "elapsed_time": "8:12:02", "remaining_time": "11:38:17"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "8:13:44", "remaining_time": "11:36:37"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "8:17:35", "remaining_time": "11:42:03"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "8:13:43", "remaining_time": "11:36:36"} +{"current_steps": 2930, "total_steps": 7064, "loss": 0.7977, "reward": null, "learning_rate": 3.1613554503509715e-05, "epoch": 0.83, "percentage": 41.48, "elapsed_time": "8:13:42", "remaining_time": "11:36:34"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "8:15:26", "remaining_time": "11:34:57"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "8:15:27", "remaining_time": "11:34:59"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "8:15:28", "remaining_time": "11:35:00"} +{"current_steps": 2940, "total_steps": 7064, "loss": 0.8171, "reward": null, "learning_rate": 3.1506267247777645e-05, "epoch": 0.83, "percentage": 41.62, "elapsed_time": "8:19:19", "remaining_time": "11:40:24"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "8:21:03", "remaining_time": "11:38:45"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "8:17:11", "remaining_time": "11:33:21"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "8:17:10", "remaining_time": "11:33:20"} +{"current_steps": 2950, "total_steps": 7064, "loss": 0.8064, "reward": null, "learning_rate": 3.139885130656563e-05, "epoch": 0.84, "percentage": 41.76, "elapsed_time": "8:17:12", "remaining_time": "11:33:23"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "8:22:50", "remaining_time": "11:37:10"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "8:18:57", "remaining_time": "11:31:48"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "8:18:56", "remaining_time": "11:31:46"} +{"current_steps": 2960, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 3.129130880442091e-05, "epoch": 0.84, "percentage": 41.9, "elapsed_time": "8:18:58", "remaining_time": "11:31:49"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "8:24:33", "remaining_time": "11:35:30"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "8:20:40", "remaining_time": "11:30:08"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "8:20:41", "remaining_time": "11:30:10"} +{"current_steps": 2970, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 3.118364186839389e-05, "epoch": 0.84, "percentage": 42.04, "elapsed_time": "8:20:42", "remaining_time": "11:30:11"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "8:26:17", "remaining_time": "11:33:51"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "8:22:24", "remaining_time": "11:28:31"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "8:22:25", "remaining_time": "11:28:33"} +{"current_steps": 2980, "total_steps": 7064, "loss": 0.7978, "reward": null, "learning_rate": 3.107585262799613e-05, "epoch": 0.84, "percentage": 42.19, "elapsed_time": "8:22:26", "remaining_time": "11:28:34"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:24:09", "remaining_time": "11:26:56"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:24:08", "remaining_time": "11:26:55"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:24:07", "remaining_time": "11:26:54"} +{"current_steps": 2990, "total_steps": 7064, "loss": 0.8268, "reward": null, "learning_rate": 3.096794321515823e-05, "epoch": 0.85, "percentage": 42.33, "elapsed_time": "8:28:01", "remaining_time": "11:32:12"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:25:55", "remaining_time": "11:25:21"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:29:46", "remaining_time": "11:30:34"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:25:54", "remaining_time": "11:25:19"} +{"current_steps": 3000, "total_steps": 7064, "loss": 0.8129, "reward": null, "learning_rate": 3.0859915764187616e-05, "epoch": 0.85, "percentage": 42.47, "elapsed_time": "8:25:53", "remaining_time": "11:25:18"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:31:25", "remaining_time": "11:28:48"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:27:34", "remaining_time": "11:23:37"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:27:33", "remaining_time": "11:23:35"} +{"current_steps": 3010, "total_steps": 7064, "loss": 0.8121, "reward": null, "learning_rate": 3.075177241172637e-05, "epoch": 0.85, "percentage": 42.61, "elapsed_time": "8:27:32", "remaining_time": "11:23:34"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:33:05", "remaining_time": "11:27:03"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:29:12", "remaining_time": "11:21:52"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:29:11", "remaining_time": "11:21:51"} +{"current_steps": 3020, "total_steps": 7064, "loss": 0.8018, "reward": null, "learning_rate": 3.064351529670895e-05, "epoch": 0.86, "percentage": 42.75, "elapsed_time": "8:29:13", "remaining_time": "11:21:53"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8191, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:30:53", "remaining_time": "11:20:10"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8191, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:34:44", "remaining_time": "11:25:18"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8191, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:30:52", "remaining_time": "11:20:08"} +{"current_steps": 3030, "total_steps": 7064, "loss": 0.8191, "reward": null, "learning_rate": 3.0535146560319895e-05, "epoch": 0.86, "percentage": 42.89, "elapsed_time": "8:30:51", "remaining_time": "11:20:07"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:36:23", "remaining_time": "11:23:32"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:32:30", "remaining_time": "11:18:23"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:32:31", "remaining_time": "11:18:25"} +{"current_steps": 3040, "total_steps": 7064, "loss": 0.813, "reward": null, "learning_rate": 3.0426668345951448e-05, "epoch": 0.86, "percentage": 43.04, "elapsed_time": "8:32:32", "remaining_time": "11:18:26"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8252, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:34:11", "remaining_time": "11:16:43"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8252, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:34:10", "remaining_time": "11:16:41"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8252, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:34:09", "remaining_time": "11:16:40"} +{"current_steps": 3050, "total_steps": 7064, "loss": 0.8252, "reward": null, "learning_rate": 3.031808279916121e-05, "epoch": 0.86, "percentage": 43.18, "elapsed_time": "8:38:03", "remaining_time": "11:21:47"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7995, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:39:47", "remaining_time": "11:20:08"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7995, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:35:56", "remaining_time": "11:15:06"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7995, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:35:54", "remaining_time": "11:15:03"} +{"current_steps": 3060, "total_steps": 7064, "loss": 0.7995, "reward": null, "learning_rate": 3.0209392067629676e-05, "epoch": 0.87, "percentage": 43.32, "elapsed_time": "8:35:55", "remaining_time": "11:15:04"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:37:40", "remaining_time": "11:13:28"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:41:31", "remaining_time": "11:18:29"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:37:38", "remaining_time": "11:13:25"} +{"current_steps": 3070, "total_steps": 7064, "loss": 0.8162, "reward": null, "learning_rate": 3.010059830111773e-05, "epoch": 0.87, "percentage": 43.46, "elapsed_time": "8:37:39", "remaining_time": "11:13:27"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:39:23", "remaining_time": "11:11:50"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:39:22", "remaining_time": "11:11:49"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:39:21", "remaining_time": "11:11:48"} +{"current_steps": 3080, "total_steps": 7064, "loss": 0.8175, "reward": null, "learning_rate": 2.9991703651424184e-05, "epoch": 0.87, "percentage": 43.6, "elapsed_time": "8:43:15", "remaining_time": "11:16:49"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8076, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:41:05", "remaining_time": "11:10:09"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8076, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:41:03", "remaining_time": "11:10:08"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8076, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:41:02", "remaining_time": "11:10:06"} +{"current_steps": 3090, "total_steps": 7064, "loss": 0.8076, "reward": null, "learning_rate": 2.988271027234317e-05, "epoch": 0.87, "percentage": 43.74, "elapsed_time": "8:44:56", "remaining_time": "11:15:06"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:46:37", "remaining_time": "11:13:24"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:42:44", "remaining_time": "11:08:26"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:42:45", "remaining_time": "11:08:27"} +{"current_steps": 3100, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.977362031962158e-05, "epoch": 0.88, "percentage": 43.88, "elapsed_time": "8:42:46", "remaining_time": "11:08:28"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:48:22", "remaining_time": "11:11:45"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:44:30", "remaining_time": "11:06:51"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:44:28", "remaining_time": "11:06:49"} +{"current_steps": 3110, "total_steps": 7064, "loss": 0.8159, "reward": null, "learning_rate": 2.966443595091637e-05, "epoch": 0.88, "percentage": 44.03, "elapsed_time": "8:44:29", "remaining_time": "11:06:50"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:46:12", "remaining_time": "11:05:10"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:50:03", "remaining_time": "11:10:03"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:46:11", "remaining_time": "11:05:09"} +{"current_steps": 3120, "total_steps": 7064, "loss": 0.8083, "reward": null, "learning_rate": 2.9555159325751947e-05, "epoch": 0.88, "percentage": 44.17, "elapsed_time": "8:46:10", "remaining_time": "11:05:08"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:47:54", "remaining_time": "11:03:30"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:51:45", "remaining_time": "11:08:21"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:47:53", "remaining_time": "11:03:29"} +{"current_steps": 3130, "total_steps": 7064, "loss": 0.807, "reward": null, "learning_rate": 2.9445792605477433e-05, "epoch": 0.89, "percentage": 44.31, "elapsed_time": "8:47:52", "remaining_time": "11:03:27"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:49:36", "remaining_time": "11:01:50"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:49:35", "remaining_time": "11:01:49"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:49:34", "remaining_time": "11:01:48"} +{"current_steps": 3140, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.933633795322391e-05, "epoch": 0.89, "percentage": 44.45, "elapsed_time": "8:53:28", "remaining_time": "11:06:40"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:51:18", "remaining_time": "11:00:10"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:55:09", "remaining_time": "11:04:57"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:51:16", "remaining_time": "11:00:07"} +{"current_steps": 3150, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.9226797533861615e-05, "epoch": 0.89, "percentage": 44.59, "elapsed_time": "8:51:17", "remaining_time": "11:00:08"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:56:53", "remaining_time": "11:03:17"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:53:00", "remaining_time": "10:58:30"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:53:01", "remaining_time": "10:58:31"} +{"current_steps": 3160, "total_steps": 7064, "loss": 0.8053, "reward": null, "learning_rate": 2.9117173513957186e-05, "epoch": 0.89, "percentage": 44.73, "elapsed_time": "8:52:59", "remaining_time": "10:58:29"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.8068, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:54:44", "remaining_time": "10:56:52"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.8068, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:54:43", "remaining_time": "10:56:51"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.8068, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:54:42", "remaining_time": "10:56:49"} +{"current_steps": 3170, "total_steps": 7064, "loss": 0.8068, "reward": null, "learning_rate": 2.900746806173074e-05, "epoch": 0.9, "percentage": 44.88, "elapsed_time": "8:58:35", "remaining_time": "11:01:36"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "8:56:30", "remaining_time": "10:55:16"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "9:00:21", "remaining_time": "10:59:59"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "8:56:28", "remaining_time": "10:55:14"} +{"current_steps": 3180, "total_steps": 7064, "loss": 0.8086, "reward": null, "learning_rate": 2.889768334701305e-05, "epoch": 0.9, "percentage": 45.02, "elapsed_time": "8:56:29", "remaining_time": "10:55:15"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "9:02:04", "remaining_time": "10:58:17"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "8:58:12", "remaining_time": "10:53:36"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "8:58:10", "remaining_time": "10:53:34"} +{"current_steps": 3190, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8787821541202564e-05, "epoch": 0.9, "percentage": 45.16, "elapsed_time": "8:58:11", "remaining_time": "10:53:35"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.8019, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "8:59:51", "remaining_time": "10:51:52"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.8019, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "9:03:42", "remaining_time": "10:56:32"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.8019, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "8:59:50", "remaining_time": "10:51:51"} +{"current_steps": 3200, "total_steps": 7064, "loss": 0.8019, "reward": null, "learning_rate": 2.8677884817222505e-05, "epoch": 0.91, "percentage": 45.3, "elapsed_time": "8:59:49", "remaining_time": "10:51:50"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "9:05:25", "remaining_time": "10:54:50"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "9:01:31", "remaining_time": "10:50:10"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "9:01:32", "remaining_time": "10:50:11"} +{"current_steps": 3210, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.856787534947789e-05, "epoch": 0.91, "percentage": 45.44, "elapsed_time": "9:01:33", "remaining_time": "10:50:12"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8243, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "9:03:16", "remaining_time": "10:48:33"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8243, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "9:03:15", "remaining_time": "10:48:32"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8243, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "9:03:14", "remaining_time": "10:48:31"} +{"current_steps": 3220, "total_steps": 7064, "loss": 0.8243, "reward": null, "learning_rate": 2.8457795313812507e-05, "epoch": 0.91, "percentage": 45.58, "elapsed_time": "9:07:08", "remaining_time": "10:53:09"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "9:04:59", "remaining_time": "10:46:53"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "9:04:57", "remaining_time": "10:46:51"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "9:04:57", "remaining_time": "10:46:52"} +{"current_steps": 3230, "total_steps": 7064, "loss": 0.7953, "reward": null, "learning_rate": 2.8347646887465867e-05, "epoch": 0.91, "percentage": 45.72, "elapsed_time": "9:08:50", "remaining_time": "10:51:28"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "9:06:41", "remaining_time": "10:45:13"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "9:10:32", "remaining_time": "10:49:46"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "9:06:39", "remaining_time": "10:45:11"} +{"current_steps": 3240, "total_steps": 7064, "loss": 0.8042, "reward": null, "learning_rate": 2.8237432249030183e-05, "epoch": 0.92, "percentage": 45.87, "elapsed_time": "9:06:40", "remaining_time": "10:45:12"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.799, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "9:08:23", "remaining_time": "10:43:33"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.799, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "9:12:16", "remaining_time": "10:48:06"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.799, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "9:08:22", "remaining_time": "10:43:32"} +{"current_steps": 3250, "total_steps": 7064, "loss": 0.799, "reward": null, "learning_rate": 2.812715357840725e-05, "epoch": 0.92, "percentage": 46.01, "elapsed_time": "9:08:24", "remaining_time": "10:43:35"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "9:10:09", "remaining_time": "10:41:58"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "9:10:08", "remaining_time": "10:41:56"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "9:10:07", "remaining_time": "10:41:55"} +{"current_steps": 3260, "total_steps": 7064, "loss": 0.8093, "reward": null, "learning_rate": 2.801681305676534e-05, "epoch": 0.92, "percentage": 46.15, "elapsed_time": "9:14:01", "remaining_time": "10:46:28"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "9:11:54", "remaining_time": "10:40:20"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "9:15:45", "remaining_time": "10:44:48"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "9:11:52", "remaining_time": "10:40:18"} +{"current_steps": 3270, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 2.7906412866496034e-05, "epoch": 0.93, "percentage": 46.29, "elapsed_time": "9:11:53", "remaining_time": "10:40:19"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "9:17:29", "remaining_time": "10:43:09"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "9:13:38", "remaining_time": "10:38:42"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "9:13:37", "remaining_time": "10:38:41"} +{"current_steps": 3280, "total_steps": 7064, "loss": 0.8116, "reward": null, "learning_rate": 2.7795955191171114e-05, "epoch": 0.93, "percentage": 46.43, "elapsed_time": "9:13:36", "remaining_time": "10:38:40"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "9:19:11", "remaining_time": "10:41:27"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "9:15:20", "remaining_time": "10:37:02"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "9:15:19", "remaining_time": "10:37:01"} +{"current_steps": 3290, "total_steps": 7064, "loss": 0.8151, "reward": null, "learning_rate": 2.7685442215499323e-05, "epoch": 0.93, "percentage": 46.57, "elapsed_time": "9:15:18", "remaining_time": "10:36:59"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "9:20:56", "remaining_time": "10:39:48"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "9:17:03", "remaining_time": "10:35:22"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "9:17:03", "remaining_time": "10:35:23"} +{"current_steps": 3300, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.7574876125283176e-05, "epoch": 0.93, "percentage": 46.72, "elapsed_time": "9:17:05", "remaining_time": "10:35:24"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "9:18:45", "remaining_time": "10:33:42"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "9:22:36", "remaining_time": "10:38:05"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "9:18:44", "remaining_time": "10:33:41"} +{"current_steps": 3310, "total_steps": 7064, "loss": 0.8051, "reward": null, "learning_rate": 2.7464259107375722e-05, "epoch": 0.94, "percentage": 46.86, "elapsed_time": "9:18:43", "remaining_time": "10:33:40"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "9:20:30", "remaining_time": "10:32:06"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "9:24:22", "remaining_time": "10:36:26"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "9:20:28", "remaining_time": "10:32:03"} +{"current_steps": 3320, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 2.7353593349637297e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "9:20:29", "remaining_time": "10:32:04"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "9:26:01", "remaining_time": "10:34:41"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "9:22:09", "remaining_time": "10:30:21"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "9:22:08", "remaining_time": "10:30:20"} +{"current_steps": 3330, "total_steps": 7064, "loss": 0.8094, "reward": null, "learning_rate": 2.7242881040892255e-05, "epoch": 0.94, "percentage": 47.14, "elapsed_time": "9:22:07", "remaining_time": "10:30:19"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "9:27:45", "remaining_time": "10:33:02"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "9:23:54", "remaining_time": "10:28:44"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "9:23:53", "remaining_time": "10:28:43"} +{"current_steps": 3340, "total_steps": 7064, "loss": 0.8186, "reward": null, "learning_rate": 2.713212437088564e-05, "epoch": 0.95, "percentage": 47.28, "elapsed_time": "9:23:52", "remaining_time": "10:28:42"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "9:29:26", "remaining_time": "10:31:19"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "9:25:33", "remaining_time": "10:27:00"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "9:25:35", "remaining_time": "10:27:02"} +{"current_steps": 3350, "total_steps": 7064, "loss": 0.8041, "reward": null, "learning_rate": 2.702132553023993e-05, "epoch": 0.95, "percentage": 47.42, "elapsed_time": "9:25:34", "remaining_time": "10:27:01"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.8009, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:27:19", "remaining_time": "10:25:23"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.8009, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:27:17", "remaining_time": "10:25:22"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.8009, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:27:17", "remaining_time": "10:25:21"} +{"current_steps": 3360, "total_steps": 7064, "loss": 0.8009, "reward": null, "learning_rate": 2.691048671041169e-05, "epoch": 0.95, "percentage": 47.57, "elapsed_time": "9:31:10", "remaining_time": "10:29:38"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:29:02", "remaining_time": "10:23:45"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:32:53", "remaining_time": "10:27:58"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:29:01", "remaining_time": "10:23:43"} +{"current_steps": 3370, "total_steps": 7064, "loss": 0.7931, "reward": null, "learning_rate": 2.6799610103648197e-05, "epoch": 0.95, "percentage": 47.71, "elapsed_time": "9:29:00", "remaining_time": "10:23:42"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:34:37", "remaining_time": "10:26:18"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:30:45", "remaining_time": "10:22:06"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:30:43", "remaining_time": "10:22:03"} +{"current_steps": 3380, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.668869790294411e-05, "epoch": 0.96, "percentage": 47.85, "elapsed_time": "9:30:44", "remaining_time": "10:22:04"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8167, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:32:28", "remaining_time": "10:20:26"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8167, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:36:20", "remaining_time": "10:24:37"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8167, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:32:26", "remaining_time": "10:20:24"} +{"current_steps": 3390, "total_steps": 7064, "loss": 0.8167, "reward": null, "learning_rate": 2.6577752301998098e-05, "epoch": 0.96, "percentage": 47.99, "elapsed_time": "9:32:27", "remaining_time": "10:20:25"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8114, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:34:09", "remaining_time": "10:18:44"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8114, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:34:08", "remaining_time": "10:18:43"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8114, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:34:07", "remaining_time": "10:18:42"} +{"current_steps": 3400, "total_steps": 7064, "loss": 0.8114, "reward": null, "learning_rate": 2.6466775495169437e-05, "epoch": 0.96, "percentage": 48.13, "elapsed_time": "9:38:01", "remaining_time": "10:22:53"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.8026, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:35:50", "remaining_time": "10:17:02"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.8026, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:39:41", "remaining_time": "10:21:10"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.8026, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:35:49", "remaining_time": "10:17:01"} +{"current_steps": 3410, "total_steps": 7064, "loss": 0.8026, "reward": null, "learning_rate": 2.6355769677434628e-05, "epoch": 0.97, "percentage": 48.27, "elapsed_time": "9:35:48", "remaining_time": "10:17:00"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:37:32", "remaining_time": "10:15:21"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:37:30", "remaining_time": "10:15:19"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:37:31", "remaining_time": "10:15:20"} +{"current_steps": 3420, "total_steps": 7064, "loss": 0.8063, "reward": null, "learning_rate": 2.6244737044343954e-05, "epoch": 0.97, "percentage": 48.41, "elapsed_time": "9:41:23", "remaining_time": "10:19:28"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:39:12", "remaining_time": "10:13:39"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:43:03", "remaining_time": "10:17:44"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:39:10", "remaining_time": "10:13:37"} +{"current_steps": 3430, "total_steps": 7064, "loss": 0.8087, "reward": null, "learning_rate": 2.6133679791978065e-05, "epoch": 0.97, "percentage": 48.56, "elapsed_time": "9:39:11", "remaining_time": "10:13:38"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:40:53", "remaining_time": "10:11:57"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:40:52", "remaining_time": "10:11:56"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:40:51", "remaining_time": "10:11:55"} +{"current_steps": 3440, "total_steps": 7064, "loss": 0.812, "reward": null, "learning_rate": 2.602260011690457e-05, "epoch": 0.97, "percentage": 48.7, "elapsed_time": "9:44:44", "remaining_time": "10:16:01"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:42:36", "remaining_time": "10:10:17"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:46:27", "remaining_time": "10:14:20"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:42:34", "remaining_time": "10:10:15"} +{"current_steps": 3450, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.591150021613456e-05, "epoch": 0.98, "percentage": 48.84, "elapsed_time": "9:42:34", "remaining_time": "10:10:16"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:48:08", "remaining_time": "10:12:37"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:44:16", "remaining_time": "10:08:35"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:44:17", "remaining_time": "10:08:36"} +{"current_steps": 3460, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 2.580038228707916e-05, "epoch": 0.98, "percentage": 48.98, "elapsed_time": "9:44:15", "remaining_time": "10:08:34"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.826, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:45:56", "remaining_time": "10:06:52"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.826, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:49:47", "remaining_time": "10:10:52"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.826, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:45:55", "remaining_time": "10:06:51"} +{"current_steps": 3470, "total_steps": 7064, "loss": 0.826, "reward": null, "learning_rate": 2.568924852750607e-05, "epoch": 0.98, "percentage": 49.12, "elapsed_time": "9:45:54", "remaining_time": "10:06:50"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:47:40", "remaining_time": "10:05:14"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:51:31", "remaining_time": "10:09:12"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:47:39", "remaining_time": "10:05:13"} +{"current_steps": 3480, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.55781011354961e-05, "epoch": 0.99, "percentage": 49.26, "elapsed_time": "9:47:38", "remaining_time": "10:05:12"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:49:25", "remaining_time": "10:03:37"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:53:17", "remaining_time": "10:07:34"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:49:24", "remaining_time": "10:03:36"} +{"current_steps": 3490, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 2.5466942309399706e-05, "epoch": 0.99, "percentage": 49.41, "elapsed_time": "9:49:23", "remaining_time": "10:03:35"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:55:00", "remaining_time": "10:05:53"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:51:06", "remaining_time": "10:01:55"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:51:07", "remaining_time": "10:01:56"} +{"current_steps": 3500, "total_steps": 7064, "loss": 0.8001, "reward": null, "learning_rate": 2.535577424779347e-05, "epoch": 0.99, "percentage": 49.55, "elapsed_time": "9:51:08", "remaining_time": "10:01:57"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.7906, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:52:53", "remaining_time": "10:00:19"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.7906, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:52:51", "remaining_time": "10:00:17"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.7906, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:52:52", "remaining_time": "10:00:18"} +{"current_steps": 3510, "total_steps": 7064, "loss": 0.7906, "reward": null, "learning_rate": 2.5244599149436642e-05, "epoch": 0.99, "percentage": 49.69, "elapsed_time": "9:56:45", "remaining_time": "10:04:14"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:54:37", "remaining_time": "9:58:41"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:54:35", "remaining_time": "9:58:39"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:54:36", "remaining_time": "9:58:40"} +{"current_steps": 3520, "total_steps": 7064, "loss": 0.804, "reward": null, "learning_rate": 2.5133419213227684e-05, "epoch": 1.0, "percentage": 49.83, "elapsed_time": "9:58:29", "remaining_time": "10:02:33"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "10:00:10", "remaining_time": "10:00:51"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "9:56:19", "remaining_time": "9:56:59"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "9:56:17", "remaining_time": "9:56:57"} +{"current_steps": 3530, "total_steps": 7064, "loss": 0.8123, "reward": null, "learning_rate": 2.5022236638160712e-05, "epoch": 1.0, "percentage": 49.97, "elapsed_time": "9:56:18", "remaining_time": "9:56:58"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8164, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "9:58:01", "remaining_time": "9:55:19"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8164, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "9:57:59", "remaining_time": "9:55:17"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8164, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "9:58:00", "remaining_time": "9:55:17"} +{"current_steps": 3540, "total_steps": 7064, "loss": 0.8164, "reward": null, "learning_rate": 2.491105362328204e-05, "epoch": 1.0, "percentage": 50.11, "elapsed_time": "10:01:52", "remaining_time": "9:59:09"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "9:59:39", "remaining_time": "9:53:34"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "9:59:37", "remaining_time": "9:53:32"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "9:59:38", "remaining_time": "9:53:33"} +{"current_steps": 3550, "total_steps": 7064, "loss": 0.8169, "reward": null, "learning_rate": 2.4799872367646685e-05, "epoch": 1.01, "percentage": 50.25, "elapsed_time": "10:03:30", "remaining_time": "9:57:23"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "10:05:12", "remaining_time": "9:55:40"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "10:01:20", "remaining_time": "9:51:53"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "10:01:18", "remaining_time": "9:51:51"} +{"current_steps": 3560, "total_steps": 7064, "loss": 0.7835, "reward": null, "learning_rate": 2.468869507027486e-05, "epoch": 1.01, "percentage": 50.4, "elapsed_time": "10:01:19", "remaining_time": "9:51:52"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "10:03:03", "remaining_time": "9:50:13"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "10:06:56", "remaining_time": "9:54:00"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "10:03:02", "remaining_time": "9:50:12"} +{"current_steps": 3570, "total_steps": 7064, "loss": 0.8199, "reward": null, "learning_rate": 2.457752393010851e-05, "epoch": 1.01, "percentage": 50.54, "elapsed_time": "10:03:04", "remaining_time": "9:50:14"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8096, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "10:04:46", "remaining_time": "9:48:33"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8096, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "10:08:37", "remaining_time": "9:52:18"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8096, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "10:04:44", "remaining_time": "9:48:31"} +{"current_steps": 3580, "total_steps": 7064, "loss": 0.8096, "reward": null, "learning_rate": 2.4466361145967782e-05, "epoch": 1.01, "percentage": 50.68, "elapsed_time": "10:04:45", "remaining_time": "9:48:32"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "10:10:21", "remaining_time": "9:50:38"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "10:06:30", "remaining_time": "9:46:54"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "10:06:28", "remaining_time": "9:46:52"} +{"current_steps": 3590, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 2.4355208916507554e-05, "epoch": 1.02, "percentage": 50.82, "elapsed_time": "10:06:29", "remaining_time": "9:46:53"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "10:08:12", "remaining_time": "9:45:13"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "10:08:11", "remaining_time": "9:45:12"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "10:08:10", "remaining_time": "9:45:11"} +{"current_steps": 3600, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.4244069440173938e-05, "epoch": 1.02, "percentage": 50.96, "elapsed_time": "10:12:03", "remaining_time": "9:48:56"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "10:09:54", "remaining_time": "9:43:33"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "10:13:46", "remaining_time": "9:47:14"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "10:09:52", "remaining_time": "9:43:31"} +{"current_steps": 3610, "total_steps": 7064, "loss": 0.8127, "reward": null, "learning_rate": 2.413294491516083e-05, "epoch": 1.02, "percentage": 51.1, "elapsed_time": "10:09:53", "remaining_time": "9:43:32"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.816, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "10:15:28", "remaining_time": "9:45:32"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.816, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "10:11:35", "remaining_time": "9:41:51"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.816, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "10:11:35", "remaining_time": "9:41:50"} +{"current_steps": 3620, "total_steps": 7064, "loss": 0.816, "reward": null, "learning_rate": 2.402183753936639e-05, "epoch": 1.02, "percentage": 51.25, "elapsed_time": "10:11:37", "remaining_time": "9:41:52"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "10:17:10", "remaining_time": "9:43:51"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "10:13:18", "remaining_time": "9:40:11"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "10:13:17", "remaining_time": "9:40:10"} +{"current_steps": 3630, "total_steps": 7064, "loss": 0.8045, "reward": null, "learning_rate": 2.3910749510349574e-05, "epoch": 1.03, "percentage": 51.39, "elapsed_time": "10:13:19", "remaining_time": "9:40:12"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "10:18:51", "remaining_time": "9:42:08"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "10:15:00", "remaining_time": "9:38:30"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "10:14:58", "remaining_time": "9:38:28"} +{"current_steps": 3640, "total_steps": 7064, "loss": 0.8065, "reward": null, "learning_rate": 2.3799683025286727e-05, "epoch": 1.03, "percentage": 51.53, "elapsed_time": "10:14:59", "remaining_time": "9:38:29"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "10:16:39", "remaining_time": "9:36:47"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "10:16:38", "remaining_time": "9:36:46"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "10:16:37", "remaining_time": "9:36:45"} +{"current_steps": 3650, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.3688640280928043e-05, "epoch": 1.03, "percentage": 51.67, "elapsed_time": "10:20:31", "remaining_time": "9:40:23"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "10:18:21", "remaining_time": "9:35:06"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "10:22:12", "remaining_time": "9:38:41"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "10:18:19", "remaining_time": "9:35:04"} +{"current_steps": 3660, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 2.357762347355418e-05, "epoch": 1.04, "percentage": 51.81, "elapsed_time": "10:18:19", "remaining_time": "9:35:04"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8044, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "10:23:52", "remaining_time": "9:36:57"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8044, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "10:20:00", "remaining_time": "9:33:22"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8044, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "10:20:01", "remaining_time": "9:33:23"} +{"current_steps": 3670, "total_steps": 7064, "loss": 0.8044, "reward": null, "learning_rate": 2.346663479893277e-05, "epoch": 1.04, "percentage": 51.95, "elapsed_time": "10:19:59", "remaining_time": "9:33:21"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8136, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "10:21:43", "remaining_time": "9:31:43"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8136, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "10:25:35", "remaining_time": "9:35:16"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8136, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "10:21:41", "remaining_time": "9:31:41"} +{"current_steps": 3680, "total_steps": 7064, "loss": 0.8136, "reward": null, "learning_rate": 2.3355676452275057e-05, "epoch": 1.04, "percentage": 52.1, "elapsed_time": "10:21:42", "remaining_time": "9:31:42"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "10:23:24", "remaining_time": "9:30:01"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "10:27:16", "remaining_time": "9:33:33"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "10:23:22", "remaining_time": "9:29:59"} +{"current_steps": 3690, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.3244750628192395e-05, "epoch": 1.04, "percentage": 52.24, "elapsed_time": "10:23:23", "remaining_time": "9:30:00"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "10:28:58", "remaining_time": "9:31:51"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "10:25:07", "remaining_time": "9:28:21"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "10:25:06", "remaining_time": "9:28:20"} +{"current_steps": 3700, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 2.313385952065291e-05, "epoch": 1.05, "percentage": 52.38, "elapsed_time": "10:25:05", "remaining_time": "9:28:19"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "10:26:47", "remaining_time": "9:26:38"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "10:26:49", "remaining_time": "9:26:40"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "10:26:48", "remaining_time": "9:26:39"} +{"current_steps": 3710, "total_steps": 7064, "loss": 0.8117, "reward": null, "learning_rate": 2.302300532293806e-05, "epoch": 1.05, "percentage": 52.52, "elapsed_time": "10:30:40", "remaining_time": "9:30:09"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "10:28:32", "remaining_time": "9:25:00"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "10:32:23", "remaining_time": "9:28:28"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "10:28:31", "remaining_time": "9:24:59"} +{"current_steps": 3720, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2912190227599305e-05, "epoch": 1.05, "percentage": 52.66, "elapsed_time": "10:28:30", "remaining_time": "9:24:58"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:30:13", "remaining_time": "9:23:18"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:34:04", "remaining_time": "9:26:45"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:30:11", "remaining_time": "9:23:17"} +{"current_steps": 3730, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 2.280141642641468e-05, "epoch": 1.06, "percentage": 52.8, "elapsed_time": "10:30:12", "remaining_time": "9:23:17"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7996, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:35:48", "remaining_time": "9:25:05"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7996, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:31:55", "remaining_time": "9:21:38"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7996, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:31:56", "remaining_time": "9:21:38"} +{"current_steps": 3740, "total_steps": 7064, "loss": 0.7996, "reward": null, "learning_rate": 2.26906861103455e-05, "epoch": 1.06, "percentage": 52.94, "elapsed_time": "10:31:57", "remaining_time": "9:21:39"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.806, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:37:34", "remaining_time": "9:23:26"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.806, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:33:43", "remaining_time": "9:20:02"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.806, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:33:41", "remaining_time": "9:20:00"} +{"current_steps": 3750, "total_steps": 7064, "loss": 0.806, "reward": null, "learning_rate": 2.2580001469492968e-05, "epoch": 1.06, "percentage": 53.09, "elapsed_time": "10:33:42", "remaining_time": "9:20:01"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:35:22", "remaining_time": "9:18:19"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:39:14", "remaining_time": "9:21:42"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:35:21", "remaining_time": "9:18:18"} +{"current_steps": 3760, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.2469364693054938e-05, "epoch": 1.06, "percentage": 53.23, "elapsed_time": "10:35:20", "remaining_time": "9:18:17"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:40:58", "remaining_time": "9:20:03"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:37:06", "remaining_time": "9:16:40"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:37:07", "remaining_time": "9:16:40"} +{"current_steps": 3770, "total_steps": 7064, "loss": 0.8017, "reward": null, "learning_rate": 2.235877796928252e-05, "epoch": 1.07, "percentage": 53.37, "elapsed_time": "10:37:05", "remaining_time": "9:16:39"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:38:50", "remaining_time": "9:15:01"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:42:41", "remaining_time": "9:18:21"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:38:48", "remaining_time": "9:14:59"} +{"current_steps": 3780, "total_steps": 7064, "loss": 0.8066, "reward": null, "learning_rate": 2.2248243485436892e-05, "epoch": 1.07, "percentage": 53.51, "elapsed_time": "10:38:49", "remaining_time": "9:15:00"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:44:21", "remaining_time": "9:16:38"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:40:29", "remaining_time": "9:13:17"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:40:28", "remaining_time": "9:13:16"} +{"current_steps": 3790, "total_steps": 7064, "loss": 0.7969, "reward": null, "learning_rate": 2.213776342774595e-05, "epoch": 1.07, "percentage": 53.65, "elapsed_time": "10:40:30", "remaining_time": "9:13:18"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:42:13", "remaining_time": "9:11:37"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:46:04", "remaining_time": "9:14:56"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:42:12", "remaining_time": "9:11:37"} +{"current_steps": 3800, "total_steps": 7064, "loss": 0.8008, "reward": null, "learning_rate": 2.2027339981361156e-05, "epoch": 1.08, "percentage": 53.79, "elapsed_time": "10:42:11", "remaining_time": "9:11:36"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:43:50", "remaining_time": "9:09:52"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:47:41", "remaining_time": "9:13:10"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:43:48", "remaining_time": "9:09:51"} +{"current_steps": 3810, "total_steps": 7064, "loss": 0.8111, "reward": null, "learning_rate": 2.1916975330314235e-05, "epoch": 1.08, "percentage": 53.94, "elapsed_time": "10:43:49", "remaining_time": "9:09:51"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:45:33", "remaining_time": "9:08:13"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:45:31", "remaining_time": "9:08:11"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:45:32", "remaining_time": "9:08:12"} +{"current_steps": 3820, "total_steps": 7064, "loss": 0.7797, "reward": null, "learning_rate": 2.1806671657474048e-05, "epoch": 1.08, "percentage": 54.08, "elapsed_time": "10:49:24", "remaining_time": "9:11:29"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:47:12", "remaining_time": "9:06:29"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:47:10", "remaining_time": "9:06:27"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:47:11", "remaining_time": "9:06:28"} +{"current_steps": 3830, "total_steps": 7064, "loss": 0.8016, "reward": null, "learning_rate": 2.1696431144503356e-05, "epoch": 1.08, "percentage": 54.22, "elapsed_time": "10:51:03", "remaining_time": "9:09:44"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:48:57", "remaining_time": "9:04:51"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:48:56", "remaining_time": "9:04:50"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:48:55", "remaining_time": "9:04:49"} +{"current_steps": 3840, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 2.1586255971815738e-05, "epoch": 1.09, "percentage": 54.36, "elapsed_time": "10:52:48", "remaining_time": "9:08:05"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:50:39", "remaining_time": "9:03:10"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:54:31", "remaining_time": "9:06:23"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:50:37", "remaining_time": "9:03:08"} +{"current_steps": 3850, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 2.147614831853239e-05, "epoch": 1.09, "percentage": 54.5, "elapsed_time": "10:50:38", "remaining_time": "9:03:09"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:52:20", "remaining_time": "9:01:28"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:52:18", "remaining_time": "9:01:27"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:52:19", "remaining_time": "9:01:27"} +{"current_steps": 3860, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 2.136611036243908e-05, "epoch": 1.09, "percentage": 54.64, "elapsed_time": "10:56:11", "remaining_time": "9:04:40"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:54:01", "remaining_time": "8:59:46"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:53:59", "remaining_time": "8:59:44"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:53:59", "remaining_time": "8:59:45"} +{"current_steps": 3870, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 2.1256144279943066e-05, "epoch": 1.1, "percentage": 54.78, "elapsed_time": "10:57:52", "remaining_time": "9:02:57"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7823, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:55:47", "remaining_time": "8:58:09"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7823, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:59:39", "remaining_time": "9:01:19"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7823, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:55:45", "remaining_time": "8:58:07"} +{"current_steps": 3880, "total_steps": 7064, "loss": 0.7823, "reward": null, "learning_rate": 2.114625224603002e-05, "epoch": 1.1, "percentage": 54.93, "elapsed_time": "10:55:46", "remaining_time": "8:58:08"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "10:57:36", "remaining_time": "8:56:34"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "11:01:27", "remaining_time": "8:59:42"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "10:57:35", "remaining_time": "8:56:33"} +{"current_steps": 3890, "total_steps": 7064, "loss": 0.8101, "reward": null, "learning_rate": 2.1036436434221048e-05, "epoch": 1.1, "percentage": 55.07, "elapsed_time": "10:57:34", "remaining_time": "8:56:32"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "10:59:16", "remaining_time": "8:54:51"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "10:59:15", "remaining_time": "8:54:50"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "10:59:14", "remaining_time": "8:54:49"} +{"current_steps": 3900, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 2.0926699016529656e-05, "epoch": 1.1, "percentage": 55.21, "elapsed_time": "11:03:07", "remaining_time": "8:57:59"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7993, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "11:00:55", "remaining_time": "8:53:07"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7993, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "11:04:48", "remaining_time": "8:56:16"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7993, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "11:00:56", "remaining_time": "8:53:08"} +{"current_steps": 3910, "total_steps": 7064, "loss": 0.7993, "reward": null, "learning_rate": 2.0817042163418858e-05, "epoch": 1.11, "percentage": 55.35, "elapsed_time": "11:00:57", "remaining_time": "8:53:09"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "11:02:38", "remaining_time": "8:51:27"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "11:06:29", "remaining_time": "8:54:33"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "11:02:36", "remaining_time": "8:51:26"} +{"current_steps": 3920, "total_steps": 7064, "loss": 0.8107, "reward": null, "learning_rate": 2.0707468043758156e-05, "epoch": 1.11, "percentage": 55.49, "elapsed_time": "11:02:37", "remaining_time": "8:51:27"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "11:04:18", "remaining_time": "8:49:45"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "11:04:17", "remaining_time": "8:49:44"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "11:04:16", "remaining_time": "8:49:43"} +{"current_steps": 3930, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 2.059797882478074e-05, "epoch": 1.11, "percentage": 55.63, "elapsed_time": "11:08:09", "remaining_time": "8:52:49"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "11:09:55", "remaining_time": "8:51:10"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "11:06:02", "remaining_time": "8:48:06"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "11:06:01", "remaining_time": "8:48:05"} +{"current_steps": 3940, "total_steps": 7064, "loss": 0.8144, "reward": null, "learning_rate": 2.048857667204053e-05, "epoch": 1.12, "percentage": 55.78, "elapsed_time": "11:06:03", "remaining_time": "8:48:07"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "11:07:45", "remaining_time": "8:46:25"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "11:11:36", "remaining_time": "8:49:28"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "11:07:44", "remaining_time": "8:46:24"} +{"current_steps": 3950, "total_steps": 7064, "loss": 0.7894, "reward": null, "learning_rate": 2.0379263749369434e-05, "epoch": 1.12, "percentage": 55.92, "elapsed_time": "11:07:43", "remaining_time": "8:46:24"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7763, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "11:09:27", "remaining_time": "8:44:44"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7763, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "11:13:18", "remaining_time": "8:47:45"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7763, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "11:09:26", "remaining_time": "8:44:43"} +{"current_steps": 3960, "total_steps": 7064, "loss": 0.7763, "reward": null, "learning_rate": 2.027004221883447e-05, "epoch": 1.12, "percentage": 56.06, "elapsed_time": "11:09:25", "remaining_time": "8:44:43"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "11:11:06", "remaining_time": "8:43:01"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "11:14:57", "remaining_time": "8:46:01"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "11:11:04", "remaining_time": "8:43:00"} +{"current_steps": 3970, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 2.016091424069506e-05, "epoch": 1.12, "percentage": 56.2, "elapsed_time": "11:11:04", "remaining_time": "8:42:59"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "11:12:46", "remaining_time": "8:41:19"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "11:16:38", "remaining_time": "8:44:18"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "11:12:44", "remaining_time": "8:41:17"} +{"current_steps": 3980, "total_steps": 7064, "loss": 0.7878, "reward": null, "learning_rate": 2.0051881973360266e-05, "epoch": 1.13, "percentage": 56.34, "elapsed_time": "11:12:45", "remaining_time": "8:41:18"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "11:18:20", "remaining_time": "8:42:36"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "11:14:29", "remaining_time": "8:39:38"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "11:14:27", "remaining_time": "8:39:37"} +{"current_steps": 3990, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 1.9942947573346133e-05, "epoch": 1.13, "percentage": 56.48, "elapsed_time": "11:14:28", "remaining_time": "8:39:37"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.8036, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "11:16:10", "remaining_time": "8:37:57"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.8036, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "11:20:02", "remaining_time": "8:40:54"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.8036, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "11:16:09", "remaining_time": "8:37:56"} +{"current_steps": 4000, "total_steps": 7064, "loss": 0.8036, "reward": null, "learning_rate": 1.9834113195233e-05, "epoch": 1.13, "percentage": 56.63, "elapsed_time": "11:16:08", "remaining_time": "8:37:55"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7945, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "11:17:57", "remaining_time": "8:36:19"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7945, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "11:21:48", "remaining_time": "8:39:16"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7945, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "11:17:56", "remaining_time": "8:36:19"} +{"current_steps": 4010, "total_steps": 7064, "loss": 0.7945, "reward": null, "learning_rate": 1.9725380991622923e-05, "epoch": 1.14, "percentage": 56.77, "elapsed_time": "11:17:55", "remaining_time": "8:36:18"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7955, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "11:19:38", "remaining_time": "8:34:37"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7955, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "11:19:37", "remaining_time": "8:34:37"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7955, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "11:19:36", "remaining_time": "8:34:36"} +{"current_steps": 4020, "total_steps": 7064, "loss": 0.7955, "reward": null, "learning_rate": 1.961675311309705e-05, "epoch": 1.14, "percentage": 56.91, "elapsed_time": "11:23:29", "remaining_time": "8:37:33"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "11:21:18", "remaining_time": "8:32:55"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "11:25:09", "remaining_time": "8:35:49"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "11:21:16", "remaining_time": "8:32:53"} +{"current_steps": 4030, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 1.9508231708173146e-05, "epoch": 1.14, "percentage": 57.05, "elapsed_time": "11:21:17", "remaining_time": "8:32:54"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "11:23:01", "remaining_time": "8:31:14"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "11:22:59", "remaining_time": "8:31:14"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "11:26:52", "remaining_time": "8:34:08"} +{"current_steps": 4040, "total_steps": 7064, "loss": 0.7805, "reward": null, "learning_rate": 1.9399818923263056e-05, "epoch": 1.14, "percentage": 57.19, "elapsed_time": "11:22:59", "remaining_time": "8:31:13"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "11:24:46", "remaining_time": "8:29:36"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "11:24:44", "remaining_time": "8:29:34"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "11:24:45", "remaining_time": "8:29:35"} +{"current_steps": 4050, "total_steps": 7064, "loss": 0.798, "reward": null, "learning_rate": 1.929151690263026e-05, "epoch": 1.15, "percentage": 57.33, "elapsed_time": "11:28:37", "remaining_time": "8:32:28"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8183, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "11:26:29", "remaining_time": "8:27:55"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8183, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "11:30:20", "remaining_time": "8:30:47"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8183, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "11:26:27", "remaining_time": "8:27:54"} +{"current_steps": 4060, "total_steps": 7064, "loss": 0.8183, "reward": null, "learning_rate": 1.918332778834745e-05, "epoch": 1.15, "percentage": 57.47, "elapsed_time": "11:26:28", "remaining_time": "8:27:55"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "11:28:10", "remaining_time": "8:26:14"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "11:32:01", "remaining_time": "8:29:04"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "11:28:08", "remaining_time": "8:26:12"} +{"current_steps": 4070, "total_steps": 7064, "loss": 0.8106, "reward": null, "learning_rate": 1.9075253720254217e-05, "epoch": 1.15, "percentage": 57.62, "elapsed_time": "11:28:09", "remaining_time": "8:26:13"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "11:29:49", "remaining_time": "8:24:31"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "11:33:41", "remaining_time": "8:27:20"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "11:29:47", "remaining_time": "8:24:29"} +{"current_steps": 4080, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.8967296835914643e-05, "epoch": 1.16, "percentage": 57.76, "elapsed_time": "11:29:48", "remaining_time": "8:24:30"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "11:31:37", "remaining_time": "8:22:54"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "11:35:28", "remaining_time": "8:25:42"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "11:31:36", "remaining_time": "8:22:53"} +{"current_steps": 4090, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.885945927057511e-05, "epoch": 1.16, "percentage": 57.9, "elapsed_time": "11:31:35", "remaining_time": "8:22:52"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:33:20", "remaining_time": "8:21:13"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:37:11", "remaining_time": "8:24:01"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:33:18", "remaining_time": "8:21:12"} +{"current_steps": 4100, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 1.8751743157122003e-05, "epoch": 1.16, "percentage": 58.04, "elapsed_time": "11:33:19", "remaining_time": "8:21:13"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7952, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:35:06", "remaining_time": "8:19:35"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7952, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:38:57", "remaining_time": "8:22:21"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7952, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:35:05", "remaining_time": "8:19:34"} +{"current_steps": 4110, "total_steps": 7064, "loss": 0.7952, "reward": null, "learning_rate": 1.8644150626039534e-05, "epoch": 1.16, "percentage": 58.18, "elapsed_time": "11:35:04", "remaining_time": "8:19:34"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:40:42", "remaining_time": "8:20:42"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:36:51", "remaining_time": "8:17:57"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:36:50", "remaining_time": "8:17:56"} +{"current_steps": 4120, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.8536683805367656e-05, "epoch": 1.17, "percentage": 58.32, "elapsed_time": "11:36:49", "remaining_time": "8:17:55"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:38:32", "remaining_time": "8:16:14"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:42:23", "remaining_time": "8:18:59"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:38:30", "remaining_time": "8:16:13"} +{"current_steps": 4130, "total_steps": 7064, "loss": 0.8005, "reward": null, "learning_rate": 1.8429344820659892e-05, "epoch": 1.17, "percentage": 58.47, "elapsed_time": "11:38:31", "remaining_time": "8:16:14"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:40:15", "remaining_time": "8:14:34"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:40:13", "remaining_time": "8:14:32"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:40:13", "remaining_time": "8:14:33"} +{"current_steps": 4140, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.832213579494137e-05, "epoch": 1.17, "percentage": 58.61, "elapsed_time": "11:44:06", "remaining_time": "8:17:17"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:45:48", "remaining_time": "8:15:35"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:41:57", "remaining_time": "8:12:53"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:41:56", "remaining_time": "8:12:52"} +{"current_steps": 4150, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.8215058848666765e-05, "epoch": 1.17, "percentage": 58.75, "elapsed_time": "11:41:55", "remaining_time": "8:12:52"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:43:42", "remaining_time": "8:11:14"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:47:33", "remaining_time": "8:13:55"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:43:40", "remaining_time": "8:11:13"} +{"current_steps": 4160, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.810811609967844e-05, "epoch": 1.18, "percentage": 58.89, "elapsed_time": "11:43:40", "remaining_time": "8:11:12"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:45:21", "remaining_time": "8:09:31"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:45:20", "remaining_time": "8:09:30"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:45:19", "remaining_time": "8:09:30"} +{"current_steps": 4170, "total_steps": 7064, "loss": 0.7719, "reward": null, "learning_rate": 1.8001309663164457e-05, "epoch": 1.18, "percentage": 59.03, "elapsed_time": "11:49:13", "remaining_time": "8:12:12"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8098, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:47:04", "remaining_time": "8:07:50"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8098, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:50:55", "remaining_time": "8:10:30"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8098, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:47:02", "remaining_time": "8:07:49"} +{"current_steps": 4180, "total_steps": 7064, "loss": 0.8098, "reward": null, "learning_rate": 1.7894641651616838e-05, "epoch": 1.18, "percentage": 59.17, "elapsed_time": "11:47:03", "remaining_time": "8:07:49"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7909, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:48:47", "remaining_time": "8:06:10"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7909, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:52:39", "remaining_time": "8:08:49"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7909, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:48:45", "remaining_time": "8:06:09"} +{"current_steps": 4190, "total_steps": 7064, "loss": 0.7909, "reward": null, "learning_rate": 1.7788114174789706e-05, "epoch": 1.19, "percentage": 59.31, "elapsed_time": "11:48:46", "remaining_time": "8:06:09"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.7791, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:50:30", "remaining_time": "8:04:29"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.7791, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:54:22", "remaining_time": "8:07:08"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.7791, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:50:31", "remaining_time": "8:04:30"} +{"current_steps": 4200, "total_steps": 7064, "loss": 0.7791, "reward": null, "learning_rate": 1.7681729339657626e-05, "epoch": 1.19, "percentage": 59.46, "elapsed_time": "11:50:29", "remaining_time": "8:04:29"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:52:11", "remaining_time": "8:02:48"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:52:10", "remaining_time": "8:02:47"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:52:09", "remaining_time": "8:02:47"} +{"current_steps": 4210, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 1.7575489250373867e-05, "epoch": 1.19, "percentage": 59.6, "elapsed_time": "11:56:03", "remaining_time": "8:05:25"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:53:58", "remaining_time": "8:01:10"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:53:57", "remaining_time": "8:01:09"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:53:56", "remaining_time": "8:01:08"} +{"current_steps": 4220, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.746939600822883e-05, "epoch": 1.19, "percentage": 59.74, "elapsed_time": "11:57:49", "remaining_time": "8:03:46"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:55:38", "remaining_time": "7:59:27"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:55:36", "remaining_time": "7:59:26"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:55:37", "remaining_time": "7:59:27"} +{"current_steps": 4230, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.7363451711608445e-05, "epoch": 1.2, "percentage": 59.88, "elapsed_time": "11:59:29", "remaining_time": "8:02:02"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "11:57:21", "remaining_time": "7:57:47"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "12:01:12", "remaining_time": "8:00:21"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "11:57:20", "remaining_time": "7:57:46"} +{"current_steps": 4240, "total_steps": 7064, "loss": 0.797, "reward": null, "learning_rate": 1.7257658455952747e-05, "epoch": 1.2, "percentage": 60.02, "elapsed_time": "11:57:19", "remaining_time": "7:57:45"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "12:02:57", "remaining_time": "7:58:41"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "11:59:04", "remaining_time": "7:56:06"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "11:59:05", "remaining_time": "7:56:07"} +{"current_steps": 4250, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.715201833371432e-05, "epoch": 1.2, "percentage": 60.16, "elapsed_time": "11:59:06", "remaining_time": "7:56:08"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "12:00:44", "remaining_time": "7:54:23"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "12:04:35", "remaining_time": "7:56:56"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "12:00:42", "remaining_time": "7:54:22"} +{"current_steps": 4260, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.7046533434317008e-05, "epoch": 1.21, "percentage": 60.31, "elapsed_time": "12:00:42", "remaining_time": "7:54:23"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "12:02:28", "remaining_time": "7:52:44"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "12:06:20", "remaining_time": "7:55:15"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "12:02:26", "remaining_time": "7:52:43"} +{"current_steps": 4270, "total_steps": 7064, "loss": 0.7868, "reward": null, "learning_rate": 1.6941205844114522e-05, "epoch": 1.21, "percentage": 60.45, "elapsed_time": "12:02:27", "remaining_time": "7:52:43"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "12:04:10", "remaining_time": "7:51:03"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "12:04:12", "remaining_time": "7:51:04"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "12:04:11", "remaining_time": "7:51:03"} +{"current_steps": 4280, "total_steps": 7064, "loss": 0.7843, "reward": null, "learning_rate": 1.683603764634923e-05, "epoch": 1.21, "percentage": 60.59, "elapsed_time": "12:08:03", "remaining_time": "7:53:34"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "12:05:52", "remaining_time": "7:49:21"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "12:09:43", "remaining_time": "7:51:51"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "12:05:50", "remaining_time": "7:49:20"} +{"current_steps": 4290, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.6731030921110903e-05, "epoch": 1.21, "percentage": 60.73, "elapsed_time": "12:05:51", "remaining_time": "7:49:21"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "12:11:27", "remaining_time": "7:50:10"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "12:07:33", "remaining_time": "7:47:40"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "12:07:34", "remaining_time": "7:47:40"} +{"current_steps": 4300, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 1.6626187745295608e-05, "epoch": 1.22, "percentage": 60.87, "elapsed_time": "12:07:35", "remaining_time": "7:47:41"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "12:13:08", "remaining_time": "7:48:27"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "12:09:15", "remaining_time": "7:45:58"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "12:09:17", "remaining_time": "7:45:59"} +{"current_steps": 4310, "total_steps": 7064, "loss": 0.7872, "reward": null, "learning_rate": 1.65215101925646e-05, "epoch": 1.22, "percentage": 61.01, "elapsed_time": "12:09:15", "remaining_time": "7:45:59"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "12:10:58", "remaining_time": "7:44:18"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "12:14:50", "remaining_time": "7:46:45"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "12:10:56", "remaining_time": "7:44:17"} +{"current_steps": 4320, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.641700033330336e-05, "epoch": 1.22, "percentage": 61.16, "elapsed_time": "12:10:57", "remaining_time": "7:44:17"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.8049, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "12:12:41", "remaining_time": "7:42:37"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.8049, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "12:12:40", "remaining_time": "7:42:36"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.8049, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "12:12:39", "remaining_time": "7:42:36"} +{"current_steps": 4330, "total_steps": 7064, "loss": 0.8049, "reward": null, "learning_rate": 1.6312660234580585e-05, "epoch": 1.23, "percentage": 61.3, "elapsed_time": "12:16:32", "remaining_time": "7:45:03"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "12:14:26", "remaining_time": "7:40:58"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "12:18:17", "remaining_time": "7:43:23"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "12:14:25", "remaining_time": "7:40:57"} +{"current_steps": 4340, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.6208491960107324e-05, "epoch": 1.23, "percentage": 61.44, "elapsed_time": "12:14:24", "remaining_time": "7:40:57"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "12:16:09", "remaining_time": "7:39:17"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "12:20:01", "remaining_time": "7:41:42"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "12:16:08", "remaining_time": "7:39:17"} +{"current_steps": 4350, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.6104497570196193e-05, "epoch": 1.23, "percentage": 61.58, "elapsed_time": "12:16:07", "remaining_time": "7:39:16"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "12:21:43", "remaining_time": "7:40:00"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "12:17:50", "remaining_time": "7:37:36"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "12:17:49", "remaining_time": "7:37:35"} +{"current_steps": 4360, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.600067912172057e-05, "epoch": 1.23, "percentage": 61.72, "elapsed_time": "12:17:51", "remaining_time": "7:37:36"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "12:19:32", "remaining_time": "7:35:54"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "12:23:24", "remaining_time": "7:38:17"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "12:19:31", "remaining_time": "7:35:54"} +{"current_steps": 4370, "total_steps": 7064, "loss": 0.8061, "reward": null, "learning_rate": 1.5897038668073965e-05, "epoch": 1.24, "percentage": 61.86, "elapsed_time": "12:19:30", "remaining_time": "7:35:53"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "12:21:15", "remaining_time": "7:34:14"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "12:25:07", "remaining_time": "7:36:35"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "12:21:14", "remaining_time": "7:34:13"} +{"current_steps": 4380, "total_steps": 7064, "loss": 0.777, "reward": null, "learning_rate": 1.5793578259129355e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "12:21:13", "remaining_time": "7:34:12"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "12:22:57", "remaining_time": "7:32:32"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "12:22:55", "remaining_time": "7:32:31"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "12:22:56", "remaining_time": "7:32:32"} +{"current_steps": 4390, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 1.5690299941198706e-05, "epoch": 1.24, "percentage": 62.15, "elapsed_time": "12:26:48", "remaining_time": "7:34:53"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "12:28:35", "remaining_time": "7:33:14"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "12:24:43", "remaining_time": "7:30:53"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "12:24:42", "remaining_time": "7:30:53"} +{"current_steps": 4400, "total_steps": 7064, "loss": 0.7897, "reward": null, "learning_rate": 1.558720575699242e-05, "epoch": 1.25, "percentage": 62.29, "elapsed_time": "12:24:44", "remaining_time": "7:30:54"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "12:26:30", "remaining_time": "7:29:15"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "12:30:21", "remaining_time": "7:31:34"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "12:26:29", "remaining_time": "7:29:14"} +{"current_steps": 4410, "total_steps": 7064, "loss": 0.8014, "reward": null, "learning_rate": 1.548429774557901e-05, "epoch": 1.25, "percentage": 62.43, "elapsed_time": "12:26:28", "remaining_time": "7:29:14"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "12:28:15", "remaining_time": "7:27:35"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "12:32:06", "remaining_time": "7:29:54"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "12:28:14", "remaining_time": "7:27:35"} +{"current_steps": 4420, "total_steps": 7064, "loss": 0.7882, "reward": null, "learning_rate": 1.5381577942344688e-05, "epoch": 1.25, "percentage": 62.57, "elapsed_time": "12:28:13", "remaining_time": "7:27:34"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "12:29:56", "remaining_time": "7:25:54"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "12:29:54", "remaining_time": "7:25:53"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "12:29:55", "remaining_time": "7:25:53"} +{"current_steps": 4430, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 1.5279048378953222e-05, "epoch": 1.25, "percentage": 62.71, "elapsed_time": "12:33:48", "remaining_time": "7:28:11"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "12:31:34", "remaining_time": "7:24:10"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "12:35:26", "remaining_time": "7:26:27"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "12:31:33", "remaining_time": "7:24:09"} +{"current_steps": 4440, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.517671108330561e-05, "epoch": 1.26, "percentage": 62.85, "elapsed_time": "12:31:32", "remaining_time": "7:24:09"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "12:33:19", "remaining_time": "7:22:31"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "12:37:11", "remaining_time": "7:24:47"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "12:33:17", "remaining_time": "7:22:29"} +{"current_steps": 4450, "total_steps": 7064, "loss": 0.7739, "reward": null, "learning_rate": 1.5074568079500109e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "12:33:18", "remaining_time": "7:22:30"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:35:00", "remaining_time": "7:20:48"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:38:51", "remaining_time": "7:23:03"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:34:58", "remaining_time": "7:20:47"} +{"current_steps": 4460, "total_steps": 7064, "loss": 0.7911, "reward": null, "learning_rate": 1.497262138779208e-05, "epoch": 1.26, "percentage": 63.14, "elapsed_time": "12:34:59", "remaining_time": "7:20:48"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:40:33", "remaining_time": "7:21:21"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:36:42", "remaining_time": "7:19:07"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:36:41", "remaining_time": "7:19:06"} +{"current_steps": 4470, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.4870873024554138e-05, "epoch": 1.27, "percentage": 63.28, "elapsed_time": "12:36:40", "remaining_time": "7:19:06"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:42:18", "remaining_time": "7:19:41"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:38:27", "remaining_time": "7:17:27"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:38:26", "remaining_time": "7:17:27"} +{"current_steps": 4480, "total_steps": 7064, "loss": 0.803, "reward": null, "learning_rate": 1.4769325002236183e-05, "epoch": 1.27, "percentage": 63.42, "elapsed_time": "12:38:25", "remaining_time": "7:17:26"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:40:07", "remaining_time": "7:15:45"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:40:06", "remaining_time": "7:15:44"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:40:05", "remaining_time": "7:15:44"} +{"current_steps": 4490, "total_steps": 7064, "loss": 0.8048, "reward": null, "learning_rate": 1.4667979329325651e-05, "epoch": 1.27, "percentage": 63.56, "elapsed_time": "12:43:58", "remaining_time": "7:17:57"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:41:47", "remaining_time": "7:14:03"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:45:38", "remaining_time": "7:16:14"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:41:46", "remaining_time": "7:14:02"} +{"current_steps": 4500, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 1.4566838010307754e-05, "epoch": 1.27, "percentage": 63.7, "elapsed_time": "12:41:45", "remaining_time": "7:14:01"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:47:25", "remaining_time": "7:14:35"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:43:34", "remaining_time": "7:12:24"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:43:33", "remaining_time": "7:12:23"} +{"current_steps": 4510, "total_steps": 7064, "loss": 0.7765, "reward": null, "learning_rate": 1.4465903045625878e-05, "epoch": 1.28, "percentage": 63.84, "elapsed_time": "12:43:32", "remaining_time": "7:12:23"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:45:18", "remaining_time": "7:10:44"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:49:09", "remaining_time": "7:12:54"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:45:16", "remaining_time": "7:10:43"} +{"current_steps": 4520, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 1.4365176431641958e-05, "epoch": 1.28, "percentage": 63.99, "elapsed_time": "12:45:17", "remaining_time": "7:10:43"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:47:01", "remaining_time": "7:09:03"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:46:59", "remaining_time": "7:09:02"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:50:52", "remaining_time": "7:11:13"} +{"current_steps": 4530, "total_steps": 7064, "loss": 0.8015, "reward": null, "learning_rate": 1.4264660160597057e-05, "epoch": 1.28, "percentage": 64.13, "elapsed_time": "12:47:00", "remaining_time": "7:09:03"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:48:40", "remaining_time": "7:07:20"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:52:32", "remaining_time": "7:09:29"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:48:38", "remaining_time": "7:07:19"} +{"current_steps": 4540, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.41643562205719e-05, "epoch": 1.29, "percentage": 64.27, "elapsed_time": "12:48:39", "remaining_time": "7:07:20"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:54:12", "remaining_time": "7:07:46"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:50:20", "remaining_time": "7:05:38"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:50:19", "remaining_time": "7:05:37"} +{"current_steps": 4550, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 1.4064266595447584e-05, "epoch": 1.29, "percentage": 64.41, "elapsed_time": "12:50:18", "remaining_time": "7:05:37"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:52:04", "remaining_time": "7:03:57"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:55:55", "remaining_time": "7:06:04"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:52:02", "remaining_time": "7:03:56"} +{"current_steps": 4560, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 1.3964393264866368e-05, "epoch": 1.29, "percentage": 64.55, "elapsed_time": "12:52:03", "remaining_time": "7:03:57"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8033, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:53:43", "remaining_time": "7:02:14"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8033, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:53:41", "remaining_time": "7:02:13"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8033, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:53:42", "remaining_time": "7:02:14"} +{"current_steps": 4570, "total_steps": 7064, "loss": 0.8033, "reward": null, "learning_rate": 1.386473820419244e-05, "epoch": 1.29, "percentage": 64.69, "elapsed_time": "12:57:35", "remaining_time": "7:04:21"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:59:16", "remaining_time": "7:02:38"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:55:23", "remaining_time": "7:00:32"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:55:24", "remaining_time": "7:00:32"} +{"current_steps": 4580, "total_steps": 7064, "loss": 0.7973, "reward": null, "learning_rate": 1.376530338447294e-05, "epoch": 1.3, "percentage": 64.84, "elapsed_time": "12:55:25", "remaining_time": "7:00:33"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "12:57:05", "remaining_time": "6:58:50"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "13:00:56", "remaining_time": "7:00:55"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "12:57:03", "remaining_time": "6:58:49"} +{"current_steps": 4590, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.366609077239889e-05, "epoch": 1.3, "percentage": 64.98, "elapsed_time": "12:57:04", "remaining_time": "6:58:50"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "13:02:38", "remaining_time": "6:59:13"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "12:58:45", "remaining_time": "6:57:08"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "12:58:45", "remaining_time": "6:57:08"} +{"current_steps": 4600, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 1.3567102330266369e-05, "epoch": 1.3, "percentage": 65.12, "elapsed_time": "12:58:47", "remaining_time": "6:57:09"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "13:00:26", "remaining_time": "6:55:26"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "13:00:24", "remaining_time": "6:55:25"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "13:00:25", "remaining_time": "6:55:26"} +{"current_steps": 4610, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.3468340015937642e-05, "epoch": 1.31, "percentage": 65.26, "elapsed_time": "13:04:17", "remaining_time": "6:57:29"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "13:02:07", "remaining_time": "6:53:44"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "13:05:58", "remaining_time": "6:55:47"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "13:02:05", "remaining_time": "6:53:43"} +{"current_steps": 4620, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.3369805782802467e-05, "epoch": 1.31, "percentage": 65.4, "elapsed_time": "13:02:06", "remaining_time": "6:53:44"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "13:07:37", "remaining_time": "6:54:03"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "13:03:45", "remaining_time": "6:52:01"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "13:03:44", "remaining_time": "6:52:00"} +{"current_steps": 4630, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 1.3271501579739449e-05, "epoch": 1.31, "percentage": 65.54, "elapsed_time": "13:03:43", "remaining_time": "6:52:00"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "13:09:24", "remaining_time": "6:52:23"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "13:05:33", "remaining_time": "6:50:22"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "13:05:31", "remaining_time": "6:50:21"} +{"current_steps": 4640, "total_steps": 7064, "loss": 0.7826, "reward": null, "learning_rate": 1.317342935107752e-05, "epoch": 1.31, "percentage": 65.69, "elapsed_time": "13:05:32", "remaining_time": "6:50:22"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "13:07:14", "remaining_time": "6:48:41"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "13:11:05", "remaining_time": "6:50:41"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "13:07:13", "remaining_time": "6:48:40"} +{"current_steps": 4650, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.307559103655743e-05, "epoch": 1.32, "percentage": 65.83, "elapsed_time": "13:07:12", "remaining_time": "6:48:40"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "13:08:52", "remaining_time": "6:46:57"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "13:12:44", "remaining_time": "6:48:57"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "13:08:51", "remaining_time": "6:46:57"} +{"current_steps": 4660, "total_steps": 7064, "loss": 0.7962, "reward": null, "learning_rate": 1.2977988571293447e-05, "epoch": 1.32, "percentage": 65.97, "elapsed_time": "13:08:53", "remaining_time": "6:46:58"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "13:14:27", "remaining_time": "6:47:15"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "13:10:35", "remaining_time": "6:45:17"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "13:10:34", "remaining_time": "6:45:16"} +{"current_steps": 4670, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 1.288062388573501e-05, "epoch": 1.32, "percentage": 66.11, "elapsed_time": "13:10:33", "remaining_time": "6:45:16"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "13:12:18", "remaining_time": "6:43:36"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "13:16:10", "remaining_time": "6:45:34"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "13:12:17", "remaining_time": "6:43:35"} +{"current_steps": 4680, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 1.2783498905628622e-05, "epoch": 1.33, "percentage": 66.25, "elapsed_time": "13:12:16", "remaining_time": "6:43:35"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.2686615551979702e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "13:13:59", "remaining_time": "6:41:54"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.2686615551979702e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "13:14:01", "remaining_time": "6:41:55"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.2686615551979702e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "13:13:59", "remaining_time": "6:41:54"} +{"current_steps": 4690, "total_steps": 7064, "loss": 0.7926, "reward": null, "learning_rate": 1.2686615551979702e-05, "epoch": 1.33, "percentage": 66.39, "elapsed_time": "13:17:52", "remaining_time": "6:43:52"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 1.2589975741014615e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "13:19:33", "remaining_time": "6:42:09"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 1.2589975741014615e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "13:15:42", "remaining_time": "6:40:13"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 1.2589975741014615e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "13:15:40", "remaining_time": "6:40:12"} +{"current_steps": 4700, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 1.2589975741014615e-05, "epoch": 1.33, "percentage": 66.53, "elapsed_time": "13:15:39", "remaining_time": "6:40:12"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.2493581384142767e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "13:17:25", "remaining_time": "6:38:32"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.2493581384142767e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "13:21:16", "remaining_time": "6:40:28"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.2493581384142767e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "13:17:23", "remaining_time": "6:38:31"} +{"current_steps": 4710, "total_steps": 7064, "loss": 0.7992, "reward": null, "learning_rate": 1.2493581384142767e-05, "epoch": 1.33, "percentage": 66.68, "elapsed_time": "13:17:24", "remaining_time": "6:38:31"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.2397434387918824e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "13:23:01", "remaining_time": "6:38:47"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.2397434387918824e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "13:19:08", "remaining_time": "6:36:51"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.2397434387918824e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "13:19:09", "remaining_time": "6:36:52"} +{"current_steps": 4720, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.2397434387918824e-05, "epoch": 1.34, "percentage": 66.82, "elapsed_time": "13:19:10", "remaining_time": "6:36:52"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.2301536654004948e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "13:24:42", "remaining_time": "6:37:04"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.2301536654004948e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "13:20:49", "remaining_time": "6:35:09"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.2301536654004948e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "13:20:50", "remaining_time": "6:35:10"} +{"current_steps": 4730, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 1.2301536654004948e-05, "epoch": 1.34, "percentage": 66.96, "elapsed_time": "13:20:51", "remaining_time": "6:35:10"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 1.2205890079133252e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "13:22:31", "remaining_time": "6:33:28"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 1.2205890079133252e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "13:22:29", "remaining_time": "6:33:27"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 1.2205890079133252e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "13:22:30", "remaining_time": "6:33:27"} +{"current_steps": 4740, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 1.2205890079133252e-05, "epoch": 1.34, "percentage": 67.1, "elapsed_time": "13:26:22", "remaining_time": "6:35:21"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 1.2110496555068218e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "13:24:17", "remaining_time": "6:31:49"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 1.2110496555068218e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "13:28:09", "remaining_time": "6:33:41"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 1.2110496555068218e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "13:24:15", "remaining_time": "6:31:48"} +{"current_steps": 4750, "total_steps": 7064, "loss": 0.786, "reward": null, "learning_rate": 1.2110496555068218e-05, "epoch": 1.34, "percentage": 67.24, "elapsed_time": "13:24:16", "remaining_time": "6:31:48"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 1.2015357968569335e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "13:25:57", "remaining_time": "6:30:06"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 1.2015357968569335e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "13:29:48", "remaining_time": "6:31:58"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 1.2015357968569335e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "13:25:56", "remaining_time": "6:30:06"} +{"current_steps": 4760, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 1.2015357968569335e-05, "epoch": 1.35, "percentage": 67.38, "elapsed_time": "13:25:55", "remaining_time": "6:30:05"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.1920476201353763e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "13:27:38", "remaining_time": "6:28:24"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.1920476201353763e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "13:27:40", "remaining_time": "6:28:25"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.1920476201353763e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "13:31:32", "remaining_time": "6:30:17"} +{"current_steps": 4770, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 1.1920476201353763e-05, "epoch": 1.35, "percentage": 67.53, "elapsed_time": "13:27:39", "remaining_time": "6:28:25"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.1825853130059098e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "13:29:20", "remaining_time": "6:26:43"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.1825853130059098e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "13:33:11", "remaining_time": "6:28:33"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.1825853130059098e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "13:29:18", "remaining_time": "6:26:42"} +{"current_steps": 4780, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 1.1825853130059098e-05, "epoch": 1.35, "percentage": 67.67, "elapsed_time": "13:29:19", "remaining_time": "6:26:42"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.1731490626206263e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "13:31:01", "remaining_time": "6:25:01"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.1731490626206263e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "13:34:53", "remaining_time": "6:26:51"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.1731490626206263e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "13:31:00", "remaining_time": "6:25:01"} +{"current_steps": 4790, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 1.1731490626206263e-05, "epoch": 1.36, "percentage": 67.81, "elapsed_time": "13:30:59", "remaining_time": "6:25:00"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 1.16373905561625e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "13:32:45", "remaining_time": "6:23:20"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 1.16373905561625e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "13:36:36", "remaining_time": "6:25:10"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 1.16373905561625e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "13:32:44", "remaining_time": "6:23:20"} +{"current_steps": 4800, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 1.16373905561625e-05, "epoch": 1.36, "percentage": 67.95, "elapsed_time": "13:32:43", "remaining_time": "6:23:20"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7984, "reward": null, "learning_rate": 1.1543554781104477e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "13:38:17", "remaining_time": "6:23:27"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7984, "reward": null, "learning_rate": 1.1543554781104477e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "13:34:26", "remaining_time": "6:21:39"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7984, "reward": null, "learning_rate": 1.1543554781104477e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "13:34:24", "remaining_time": "6:21:38"} +{"current_steps": 4810, "total_steps": 7064, "loss": 0.7984, "reward": null, "learning_rate": 1.1543554781104477e-05, "epoch": 1.36, "percentage": 68.09, "elapsed_time": "13:34:25", "remaining_time": "6:21:38"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.1449985156981413e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "13:40:00", "remaining_time": "6:21:45"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.1449985156981413e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "13:36:07", "remaining_time": "6:19:57"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.1449985156981413e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "13:36:08", "remaining_time": "6:19:58"} +{"current_steps": 4820, "total_steps": 7064, "loss": 0.7961, "reward": null, "learning_rate": 1.1449985156981413e-05, "epoch": 1.36, "percentage": 68.23, "elapsed_time": "13:36:06", "remaining_time": "6:19:57"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1356683534478451e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:37:53", "remaining_time": "6:18:17"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1356683534478451e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:41:44", "remaining_time": "6:20:04"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1356683534478451e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:37:51", "remaining_time": "6:18:17"} +{"current_steps": 4830, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 1.1356683534478451e-05, "epoch": 1.37, "percentage": 68.37, "elapsed_time": "13:37:51", "remaining_time": "6:18:16"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 1.1263651758979967e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:39:39", "remaining_time": "6:16:38"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 1.1263651758979967e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:43:30", "remaining_time": "6:18:24"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 1.1263651758979967e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:39:38", "remaining_time": "6:16:37"} +{"current_steps": 4840, "total_steps": 7064, "loss": 0.7867, "reward": null, "learning_rate": 1.1263651758979967e-05, "epoch": 1.37, "percentage": 68.52, "elapsed_time": "13:39:37", "remaining_time": "6:16:37"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.1170891670533162e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:45:15", "remaining_time": "6:16:43"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.1170891670533162e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:41:23", "remaining_time": "6:14:57"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.1170891670533162e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:41:21", "remaining_time": "6:14:56"} +{"current_steps": 4850, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 1.1170891670533162e-05, "epoch": 1.37, "percentage": 68.66, "elapsed_time": "13:41:22", "remaining_time": "6:14:57"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.107840510381158e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:43:05", "remaining_time": "6:13:16"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.107840510381158e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:43:03", "remaining_time": "6:13:15"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.107840510381158e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:46:56", "remaining_time": "6:15:01"} +{"current_steps": 4860, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.107840510381158e-05, "epoch": 1.38, "percentage": 68.8, "elapsed_time": "13:43:04", "remaining_time": "6:13:15"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 1.0986193888078882e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:48:34", "remaining_time": "6:13:17"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 1.0986193888078882e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:44:41", "remaining_time": "6:11:32"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 1.0986193888078882e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:44:42", "remaining_time": "6:11:32"} +{"current_steps": 4870, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 1.0986193888078882e-05, "epoch": 1.38, "percentage": 68.94, "elapsed_time": "13:44:43", "remaining_time": "6:11:33"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.8037, "reward": null, "learning_rate": 1.0894259847152636e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:46:26", "remaining_time": "6:09:51"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.8037, "reward": null, "learning_rate": 1.0894259847152636e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:50:17", "remaining_time": "6:11:35"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.8037, "reward": null, "learning_rate": 1.0894259847152636e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:46:24", "remaining_time": "6:09:51"} +{"current_steps": 4880, "total_steps": 7064, "loss": 0.8037, "reward": null, "learning_rate": 1.0894259847152636e-05, "epoch": 1.38, "percentage": 69.08, "elapsed_time": "13:46:25", "remaining_time": "6:09:51"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7901, "reward": null, "learning_rate": 1.0802604799368274e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:52:00", "remaining_time": "6:09:53"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7901, "reward": null, "learning_rate": 1.0802604799368274e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:48:08", "remaining_time": "6:08:10"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7901, "reward": null, "learning_rate": 1.0802604799368274e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:48:06", "remaining_time": "6:08:09"} +{"current_steps": 4890, "total_steps": 7064, "loss": 0.7901, "reward": null, "learning_rate": 1.0802604799368274e-05, "epoch": 1.38, "percentage": 69.22, "elapsed_time": "13:48:07", "remaining_time": "6:08:10"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.0711230557543078e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:49:49", "remaining_time": "6:06:28"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.0711230557543078e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:53:41", "remaining_time": "6:08:11"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.0711230557543078e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:49:48", "remaining_time": "6:06:28"} +{"current_steps": 4900, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 1.0711230557543078e-05, "epoch": 1.39, "percentage": 69.37, "elapsed_time": "13:49:47", "remaining_time": "6:06:27"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.0620138928940394e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:51:32", "remaining_time": "6:04:47"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.0620138928940394e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:55:23", "remaining_time": "6:06:28"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.0620138928940394e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:51:30", "remaining_time": "6:04:47"} +{"current_steps": 4910, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.0620138928940394e-05, "epoch": 1.39, "percentage": 69.51, "elapsed_time": "13:51:30", "remaining_time": "6:04:46"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.0529331715233795e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:53:13", "remaining_time": "6:03:05"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.0529331715233795e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:53:15", "remaining_time": "6:03:06"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.0529331715233795e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:57:06", "remaining_time": "6:04:47"} +{"current_steps": 4920, "total_steps": 7064, "loss": 0.7971, "reward": null, "learning_rate": 1.0529331715233795e-05, "epoch": 1.39, "percentage": 69.65, "elapsed_time": "13:53:13", "remaining_time": "6:03:05"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0438810712471553e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:54:59", "remaining_time": "6:01:25"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0438810712471553e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:58:50", "remaining_time": "6:03:06"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0438810712471553e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:54:57", "remaining_time": "6:01:25"} +{"current_steps": 4930, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 1.0438810712471553e-05, "epoch": 1.4, "percentage": 69.79, "elapsed_time": "13:54:58", "remaining_time": "6:01:25"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.0348577711041021e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "13:56:39", "remaining_time": "5:59:43"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.0348577711041021e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "14:00:30", "remaining_time": "6:01:23"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.0348577711041021e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "13:56:37", "remaining_time": "5:59:42"} +{"current_steps": 4940, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 1.0348577711041021e-05, "epoch": 1.4, "percentage": 69.93, "elapsed_time": "13:56:38", "remaining_time": "5:59:43"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.0258634495633277e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "14:02:13", "remaining_time": "5:59:41"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.0258634495633277e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "13:58:22", "remaining_time": "5:58:02"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.0258634495633277e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "13:58:21", "remaining_time": "5:58:02"} +{"current_steps": 4950, "total_steps": 7064, "loss": 0.7866, "reward": null, "learning_rate": 1.0258634495633277e-05, "epoch": 1.4, "percentage": 70.07, "elapsed_time": "13:58:20", "remaining_time": "5:58:01"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 1.0168982845207797e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "14:00:04", "remaining_time": "5:56:21"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 1.0168982845207797e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "14:00:02", "remaining_time": "5:56:20"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 1.0168982845207797e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "14:00:03", "remaining_time": "5:56:20"} +{"current_steps": 4960, "total_steps": 7064, "loss": 0.8023, "reward": null, "learning_rate": 1.0168982845207797e-05, "epoch": 1.4, "percentage": 70.22, "elapsed_time": "14:03:55", "remaining_time": "5:57:59"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.0079624532957316e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "14:01:47", "remaining_time": "5:54:40"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.0079624532957316e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "14:05:38", "remaining_time": "5:56:17"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.0079624532957316e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "14:01:45", "remaining_time": "5:54:39"} +{"current_steps": 4970, "total_steps": 7064, "loss": 0.7766, "reward": null, "learning_rate": 1.0079624532957316e-05, "epoch": 1.41, "percentage": 70.36, "elapsed_time": "14:01:45", "remaining_time": "5:54:39"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 9.99056132627267e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "14:03:32", "remaining_time": "5:53:00"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 9.99056132627267e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "14:07:24", "remaining_time": "5:54:36"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 9.99056132627267e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "14:03:30", "remaining_time": "5:52:59"} +{"current_steps": 4980, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 9.99056132627267e-06, "epoch": 1.41, "percentage": 70.5, "elapsed_time": "14:03:31", "remaining_time": "5:52:59"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 9.901794986707941e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "14:05:13", "remaining_time": "5:51:18"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 9.901794986707941e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "14:05:11", "remaining_time": "5:51:17"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 9.901794986707941e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "14:09:05", "remaining_time": "5:52:54"} +{"current_steps": 4990, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 9.901794986707941e-06, "epoch": 1.41, "percentage": 70.64, "elapsed_time": "14:05:12", "remaining_time": "5:51:17"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 9.813327269945547e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "14:10:52", "remaining_time": "5:51:14"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 9.813327269945547e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "14:06:59", "remaining_time": "5:49:38"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 9.813327269945547e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "14:07:00", "remaining_time": "5:49:38"} +{"current_steps": 5000, "total_steps": 7064, "loss": 0.7852, "reward": null, "learning_rate": 9.813327269945547e-06, "epoch": 1.42, "percentage": 70.78, "elapsed_time": "14:07:01", "remaining_time": "5:49:39"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7649, "reward": null, "learning_rate": 9.725159925761532e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "14:12:35", "remaining_time": "5:49:32"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7649, "reward": null, "learning_rate": 9.725159925761532e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "14:08:43", "remaining_time": "5:47:57"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7649, "reward": null, "learning_rate": 9.725159925761532e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "14:08:42", "remaining_time": "5:47:57"} +{"current_steps": 5010, "total_steps": 7064, "loss": 0.7649, "reward": null, "learning_rate": 9.725159925761532e-06, "epoch": 1.42, "percentage": 70.92, "elapsed_time": "14:08:44", "remaining_time": "5:47:57"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 9.637294697990961e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "14:14:16", "remaining_time": "5:47:50"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 9.637294697990961e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "14:10:23", "remaining_time": "5:46:15"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 9.637294697990961e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "14:10:24", "remaining_time": "5:46:15"} +{"current_steps": 5020, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 9.637294697990961e-06, "epoch": 1.42, "percentage": 71.06, "elapsed_time": "14:10:25", "remaining_time": "5:46:16"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 9.549733324493431e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "14:16:00", "remaining_time": "5:46:08"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 9.549733324493431e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "14:12:09", "remaining_time": "5:44:35"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 9.549733324493431e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "14:12:07", "remaining_time": "5:44:34"} +{"current_steps": 5030, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 9.549733324493431e-06, "epoch": 1.42, "percentage": 71.21, "elapsed_time": "14:12:08", "remaining_time": "5:44:35"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7636, "reward": null, "learning_rate": 9.462477537118717e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "14:13:51", "remaining_time": "5:42:54"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7636, "reward": null, "learning_rate": 9.462477537118717e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "14:13:50", "remaining_time": "5:42:53"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7636, "reward": null, "learning_rate": 9.462477537118717e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "14:13:49", "remaining_time": "5:42:53"} +{"current_steps": 5040, "total_steps": 7064, "loss": 0.7636, "reward": null, "learning_rate": 9.462477537118717e-06, "epoch": 1.43, "percentage": 71.35, "elapsed_time": "14:17:43", "remaining_time": "5:44:26"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 9.375529061672467e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "14:15:35", "remaining_time": "5:41:13"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 9.375529061672467e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "14:15:34", "remaining_time": "5:41:12"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 9.375529061672467e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "14:19:26", "remaining_time": "5:42:45"} +{"current_steps": 5050, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 9.375529061672467e-06, "epoch": 1.43, "percentage": 71.49, "elapsed_time": "14:15:33", "remaining_time": "5:41:12"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7959, "reward": null, "learning_rate": 9.288889617882136e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "14:21:09", "remaining_time": "5:41:03"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7959, "reward": null, "learning_rate": 9.288889617882136e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "14:17:18", "remaining_time": "5:39:32"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7959, "reward": null, "learning_rate": 9.288889617882136e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "14:17:17", "remaining_time": "5:39:31"} +{"current_steps": 5060, "total_steps": 7064, "loss": 0.7959, "reward": null, "learning_rate": 9.288889617882136e-06, "epoch": 1.43, "percentage": 71.63, "elapsed_time": "14:17:16", "remaining_time": "5:39:31"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 9.202560919362896e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "14:19:00", "remaining_time": "5:37:50"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 9.202560919362896e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "14:22:52", "remaining_time": "5:39:21"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 9.202560919362896e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "14:18:58", "remaining_time": "5:37:49"} +{"current_steps": 5070, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 9.202560919362896e-06, "epoch": 1.44, "percentage": 71.77, "elapsed_time": "14:18:59", "remaining_time": "5:37:50"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 9.116544673583824e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "14:24:34", "remaining_time": "5:37:39"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 9.116544673583824e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "14:20:40", "remaining_time": "5:36:08"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 9.116544673583824e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "14:20:41", "remaining_time": "5:36:08"} +{"current_steps": 5080, "total_steps": 7064, "loss": 0.781, "reward": null, "learning_rate": 9.116544673583824e-06, "epoch": 1.44, "percentage": 71.91, "elapsed_time": "14:20:42", "remaining_time": "5:36:09"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 9.030842581834062e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "14:22:26", "remaining_time": "5:34:28"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 9.030842581834062e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "14:22:25", "remaining_time": "5:34:27"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 9.030842581834062e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "14:22:24", "remaining_time": "5:34:27"} +{"current_steps": 5090, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 9.030842581834062e-06, "epoch": 1.44, "percentage": 72.06, "elapsed_time": "14:26:18", "remaining_time": "5:35:58"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 8.945456339189198e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "14:27:58", "remaining_time": "5:34:15"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 8.945456339189198e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "14:24:06", "remaining_time": "5:32:46"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 8.945456339189198e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "14:24:04", "remaining_time": "5:32:45"} +{"current_steps": 5100, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 8.945456339189198e-06, "epoch": 1.44, "percentage": 72.2, "elapsed_time": "14:24:05", "remaining_time": "5:32:45"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.860387634477736e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "14:25:50", "remaining_time": "5:31:05"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.860387634477736e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "14:29:41", "remaining_time": "5:32:33"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.860387634477736e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "14:25:49", "remaining_time": "5:31:04"} +{"current_steps": 5110, "total_steps": 7064, "loss": 0.7851, "reward": null, "learning_rate": 8.860387634477736e-06, "epoch": 1.45, "percentage": 72.34, "elapsed_time": "14:25:48", "remaining_time": "5:31:04"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 8.775638150247714e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "14:27:29", "remaining_time": "5:29:22"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 8.775638150247714e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "14:27:29", "remaining_time": "5:29:22"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 8.775638150247714e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "14:27:31", "remaining_time": "5:29:23"} +{"current_steps": 5120, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 8.775638150247714e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "14:31:22", "remaining_time": "5:30:50"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 8.691209562733371e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "14:29:13", "remaining_time": "5:27:41"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 8.691209562733371e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "14:33:05", "remaining_time": "5:29:09"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 8.691209562733371e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "14:29:12", "remaining_time": "5:27:41"} +{"current_steps": 5130, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 8.691209562733371e-06, "epoch": 1.45, "percentage": 72.62, "elapsed_time": "14:29:11", "remaining_time": "5:27:41"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.7771, "reward": null, "learning_rate": 8.607103541822068e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "14:30:51", "remaining_time": "5:25:58"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.7771, "reward": null, "learning_rate": 8.607103541822068e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "14:34:42", "remaining_time": "5:27:25"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.7771, "reward": null, "learning_rate": 8.607103541822068e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "14:30:50", "remaining_time": "5:25:58"} +{"current_steps": 5140, "total_steps": 7064, "loss": 0.7771, "reward": null, "learning_rate": 8.607103541822068e-06, "epoch": 1.46, "percentage": 72.76, "elapsed_time": "14:30:49", "remaining_time": "5:25:58"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.523321751021176e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "14:32:37", "remaining_time": "5:24:18"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.523321751021176e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "14:32:35", "remaining_time": "5:24:17"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.523321751021176e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "14:32:36", "remaining_time": "5:24:18"} +{"current_steps": 5150, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.523321751021176e-06, "epoch": 1.46, "percentage": 72.9, "elapsed_time": "14:36:28", "remaining_time": "5:25:44"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 8.43986584742526e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "14:34:21", "remaining_time": "5:22:37"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 8.43986584742526e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "14:38:12", "remaining_time": "5:24:03"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 8.43986584742526e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "14:34:19", "remaining_time": "5:22:37"} +{"current_steps": 5160, "total_steps": 7064, "loss": 0.794, "reward": null, "learning_rate": 8.43986584742526e-06, "epoch": 1.46, "percentage": 73.05, "elapsed_time": "14:34:20", "remaining_time": "5:22:37"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 8.35673748168323e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "14:39:53", "remaining_time": "5:22:20"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 8.35673748168323e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "14:36:00", "remaining_time": "5:20:55"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 8.35673748168323e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "14:36:01", "remaining_time": "5:20:55"} +{"current_steps": 5170, "total_steps": 7064, "loss": 0.7854, "reward": null, "learning_rate": 8.35673748168323e-06, "epoch": 1.46, "percentage": 73.19, "elapsed_time": "14:36:02", "remaining_time": "5:20:55"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 8.273938297965736e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "14:37:47", "remaining_time": "5:19:15"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 8.273938297965736e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "14:41:38", "remaining_time": "5:20:39"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 8.273938297965736e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "14:37:46", "remaining_time": "5:19:15"} +{"current_steps": 5180, "total_steps": 7064, "loss": 0.7927, "reward": null, "learning_rate": 8.273938297965736e-06, "epoch": 1.47, "percentage": 73.33, "elapsed_time": "14:37:45", "remaining_time": "5:19:14"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.801, "reward": null, "learning_rate": 8.191469933932625e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "14:39:27", "remaining_time": "5:17:33"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.801, "reward": null, "learning_rate": 8.191469933932625e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "14:39:25", "remaining_time": "5:17:32"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.801, "reward": null, "learning_rate": 8.191469933932625e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "14:39:26", "remaining_time": "5:17:32"} +{"current_steps": 5190, "total_steps": 7064, "loss": 0.801, "reward": null, "learning_rate": 8.191469933932625e-06, "epoch": 1.47, "percentage": 73.47, "elapsed_time": "14:43:18", "remaining_time": "5:18:56"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 8.109334020700591e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:45:02", "remaining_time": "5:17:15"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 8.109334020700591e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:41:09", "remaining_time": "5:15:51"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 8.109334020700591e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:41:10", "remaining_time": "5:15:52"} +{"current_steps": 5200, "total_steps": 7064, "loss": 0.7816, "reward": null, "learning_rate": 8.109334020700591e-06, "epoch": 1.47, "percentage": 73.61, "elapsed_time": "14:41:11", "remaining_time": "5:15:52"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 8.027532182810845e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:42:52", "remaining_time": "5:14:10"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 8.027532182810845e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:46:44", "remaining_time": "5:15:32"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 8.027532182810845e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:42:51", "remaining_time": "5:14:10"} +{"current_steps": 5210, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 8.027532182810845e-06, "epoch": 1.48, "percentage": 73.75, "elapsed_time": "14:42:50", "remaining_time": "5:14:09"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 7.946066038197065e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:44:33", "remaining_time": "5:12:28"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 7.946066038197065e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:44:31", "remaining_time": "5:12:27"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 7.946066038197065e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:44:32", "remaining_time": "5:12:28"} +{"current_steps": 5220, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 7.946066038197065e-06, "epoch": 1.48, "percentage": 73.9, "elapsed_time": "14:48:25", "remaining_time": "5:13:50"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 7.86493719815333e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:46:13", "remaining_time": "5:10:46"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 7.86493719815333e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:46:12", "remaining_time": "5:10:46"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 7.86493719815333e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:46:11", "remaining_time": "5:10:45"} +{"current_steps": 5230, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 7.86493719815333e-06, "epoch": 1.48, "percentage": 74.04, "elapsed_time": "14:50:05", "remaining_time": "5:12:07"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7919, "reward": null, "learning_rate": 7.784147267302274e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:51:45", "remaining_time": "5:10:24"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7919, "reward": null, "learning_rate": 7.784147267302274e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:47:54", "remaining_time": "5:09:04"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7919, "reward": null, "learning_rate": 7.784147267302274e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:47:52", "remaining_time": "5:09:03"} +{"current_steps": 5240, "total_steps": 7064, "loss": 0.7919, "reward": null, "learning_rate": 7.784147267302274e-06, "epoch": 1.48, "percentage": 74.18, "elapsed_time": "14:47:53", "remaining_time": "5:09:04"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 7.70369784356336e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:53:30", "remaining_time": "5:08:43"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 7.70369784356336e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:49:36", "remaining_time": "5:07:22"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 7.70369784356336e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:49:37", "remaining_time": "5:07:23"} +{"current_steps": 5250, "total_steps": 7064, "loss": 0.771, "reward": null, "learning_rate": 7.70369784356336e-06, "epoch": 1.49, "percentage": 74.32, "elapsed_time": "14:49:38", "remaining_time": "5:07:23"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.62359051812124e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:55:15", "remaining_time": "5:07:02"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.62359051812124e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:51:22", "remaining_time": "5:05:42"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.62359051812124e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:51:22", "remaining_time": "5:05:42"} +{"current_steps": 5260, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.62359051812124e-06, "epoch": 1.49, "percentage": 74.46, "elapsed_time": "14:51:24", "remaining_time": "5:05:43"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 7.543826875394347e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:56:55", "remaining_time": "5:05:19"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 7.543826875394347e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:53:02", "remaining_time": "5:04:00"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 7.543826875394347e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:53:03", "remaining_time": "5:04:00"} +{"current_steps": 5270, "total_steps": 7064, "loss": 0.7744, "reward": null, "learning_rate": 7.543826875394347e-06, "epoch": 1.49, "percentage": 74.6, "elapsed_time": "14:53:04", "remaining_time": "5:04:00"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.464408493003483e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:54:45", "remaining_time": "5:02:19"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.464408493003483e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:58:38", "remaining_time": "5:03:37"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.464408493003483e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:54:46", "remaining_time": "5:02:19"} +{"current_steps": 5280, "total_steps": 7064, "loss": 0.7887, "reward": null, "learning_rate": 7.464408493003483e-06, "epoch": 1.49, "percentage": 74.75, "elapsed_time": "14:54:47", "remaining_time": "5:02:19"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7638, "reward": null, "learning_rate": 7.385336941740678e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "15:00:20", "remaining_time": "5:01:55"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7638, "reward": null, "learning_rate": 7.385336941740678e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "14:56:29", "remaining_time": "5:00:38"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7638, "reward": null, "learning_rate": 7.385336941740678e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "14:56:27", "remaining_time": "5:00:37"} +{"current_steps": 5290, "total_steps": 7064, "loss": 0.7638, "reward": null, "learning_rate": 7.385336941740678e-06, "epoch": 1.5, "percentage": 74.89, "elapsed_time": "14:56:28", "remaining_time": "5:00:37"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 7.306613785538066e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "14:58:10", "remaining_time": "4:58:56"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 7.306613785538066e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "14:58:09", "remaining_time": "4:58:55"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 7.306613785538066e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "14:58:08", "remaining_time": "4:58:55"} +{"current_steps": 5300, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 7.306613785538066e-06, "epoch": 1.5, "percentage": 75.03, "elapsed_time": "15:02:01", "remaining_time": "5:00:13"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 7.2282405814370125e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "15:03:45", "remaining_time": "4:58:31"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 7.2282405814370125e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "14:59:52", "remaining_time": "4:57:14"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 7.2282405814370125e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "14:59:53", "remaining_time": "4:57:15"} +{"current_steps": 5310, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 7.2282405814370125e-06, "epoch": 1.5, "percentage": 75.17, "elapsed_time": "14:59:54", "remaining_time": "4:57:15"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 7.150218879557263e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "15:05:25", "remaining_time": "4:56:48"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 7.150218879557263e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "15:01:34", "remaining_time": "4:55:33"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 7.150218879557263e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "15:01:33", "remaining_time": "4:55:32"} +{"current_steps": 5320, "total_steps": 7064, "loss": 0.7916, "reward": null, "learning_rate": 7.150218879557263e-06, "epoch": 1.51, "percentage": 75.31, "elapsed_time": "15:01:32", "remaining_time": "4:55:32"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 7.072550223066321e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "15:03:13", "remaining_time": "4:53:50"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 7.072550223066321e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "15:07:05", "remaining_time": "4:55:06"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 7.072550223066321e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "15:03:12", "remaining_time": "4:53:50"} +{"current_steps": 5330, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 7.072550223066321e-06, "epoch": 1.51, "percentage": 75.45, "elapsed_time": "15:03:14", "remaining_time": "4:53:50"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 6.9952361481488896e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "15:04:57", "remaining_time": "4:52:09"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 6.9952361481488896e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "15:08:49", "remaining_time": "4:53:24"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 6.9952361481488896e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "15:04:56", "remaining_time": "4:52:09"} +{"current_steps": 5340, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 6.9952361481488896e-06, "epoch": 1.51, "percentage": 75.59, "elapsed_time": "15:04:55", "remaining_time": "4:52:09"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7701, "reward": null, "learning_rate": 6.918278183976554e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "15:10:29", "remaining_time": "4:51:41"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7701, "reward": null, "learning_rate": 6.918278183976554e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "15:06:38", "remaining_time": "4:50:27"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7701, "reward": null, "learning_rate": 6.918278183976554e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "15:06:36", "remaining_time": "4:50:27"} +{"current_steps": 5350, "total_steps": 7064, "loss": 0.7701, "reward": null, "learning_rate": 6.918278183976554e-06, "epoch": 1.51, "percentage": 75.74, "elapsed_time": "15:06:37", "remaining_time": "4:50:27"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 6.841677852677447e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "15:08:16", "remaining_time": "4:48:45"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 6.841677852677447e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "15:08:14", "remaining_time": "4:48:44"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 6.841677852677447e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "15:08:15", "remaining_time": "4:48:44"} +{"current_steps": 5360, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 6.841677852677447e-06, "epoch": 1.52, "percentage": 75.88, "elapsed_time": "15:12:07", "remaining_time": "4:49:58"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7863, "reward": null, "learning_rate": 6.765436669306227e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "15:09:59", "remaining_time": "4:47:03"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7863, "reward": null, "learning_rate": 6.765436669306227e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "15:13:51", "remaining_time": "4:48:16"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7863, "reward": null, "learning_rate": 6.765436669306227e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "15:09:58", "remaining_time": "4:47:03"} +{"current_steps": 5370, "total_steps": 7064, "loss": 0.7863, "reward": null, "learning_rate": 6.765436669306227e-06, "epoch": 1.52, "percentage": 76.02, "elapsed_time": "15:09:57", "remaining_time": "4:47:03"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 6.689556141814043e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "15:11:37", "remaining_time": "4:45:20"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 6.689556141814043e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "15:11:38", "remaining_time": "4:45:21"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 6.689556141814043e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "15:11:36", "remaining_time": "4:45:20"} +{"current_steps": 5380, "total_steps": 7064, "loss": 0.7821, "reward": null, "learning_rate": 6.689556141814043e-06, "epoch": 1.52, "percentage": 76.16, "elapsed_time": "15:15:29", "remaining_time": "4:46:33"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 6.614037771018775e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "15:13:21", "remaining_time": "4:43:40"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 6.614037771018775e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "15:17:13", "remaining_time": "4:44:51"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 6.614037771018775e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "15:13:20", "remaining_time": "4:43:39"} +{"current_steps": 5390, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 6.614037771018775e-06, "epoch": 1.53, "percentage": 76.3, "elapsed_time": "15:13:19", "remaining_time": "4:43:39"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7943, "reward": null, "learning_rate": 6.538883050575284e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "15:18:52", "remaining_time": "4:43:08"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7943, "reward": null, "learning_rate": 6.538883050575284e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "15:14:59", "remaining_time": "4:41:57"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7943, "reward": null, "learning_rate": 6.538883050575284e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "15:14:59", "remaining_time": "4:41:57"} +{"current_steps": 5400, "total_steps": 7064, "loss": 0.7943, "reward": null, "learning_rate": 6.538883050575284e-06, "epoch": 1.53, "percentage": 76.44, "elapsed_time": "15:15:01", "remaining_time": "4:41:57"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 6.464093466945919e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "15:20:37", "remaining_time": "4:41:27"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 6.464093466945919e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "15:16:43", "remaining_time": "4:40:16"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 6.464093466945919e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "15:16:44", "remaining_time": "4:40:16"} +{"current_steps": 5410, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 6.464093466945919e-06, "epoch": 1.53, "percentage": 76.59, "elapsed_time": "15:16:45", "remaining_time": "4:40:16"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 6.389670499371089e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "15:18:29", "remaining_time": "4:38:35"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 6.389670499371089e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "15:18:27", "remaining_time": "4:38:35"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 6.389670499371089e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "15:22:20", "remaining_time": "4:39:45"} +{"current_steps": 5420, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 6.389670499371089e-06, "epoch": 1.53, "percentage": 76.73, "elapsed_time": "15:18:28", "remaining_time": "4:38:35"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.3156156198400315e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "15:24:03", "remaining_time": "4:38:03"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.3156156198400315e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "15:20:09", "remaining_time": "4:36:53"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.3156156198400315e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "15:20:10", "remaining_time": "4:36:54"} +{"current_steps": 5430, "total_steps": 7064, "loss": 0.7828, "reward": null, "learning_rate": 6.3156156198400315e-06, "epoch": 1.54, "percentage": 76.87, "elapsed_time": "15:20:11", "remaining_time": "4:36:54"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 6.241930293061662e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "15:21:54", "remaining_time": "4:35:13"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 6.241930293061662e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "15:25:46", "remaining_time": "4:36:22"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 6.241930293061662e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "15:21:53", "remaining_time": "4:35:12"} +{"current_steps": 5440, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 6.241930293061662e-06, "epoch": 1.54, "percentage": 77.01, "elapsed_time": "15:21:52", "remaining_time": "4:35:12"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7726, "reward": null, "learning_rate": 6.16861597643564e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "15:23:34", "remaining_time": "4:33:30"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7726, "reward": null, "learning_rate": 6.16861597643564e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "15:23:33", "remaining_time": "4:33:30"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7726, "reward": null, "learning_rate": 6.16861597643564e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "15:23:32", "remaining_time": "4:33:30"} +{"current_steps": 5450, "total_steps": 7064, "loss": 0.7726, "reward": null, "learning_rate": 6.16861597643564e-06, "epoch": 1.54, "percentage": 77.15, "elapsed_time": "15:27:25", "remaining_time": "4:34:39"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 6.0956741200235315e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "15:29:08", "remaining_time": "4:32:57"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 6.0956741200235315e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "15:25:15", "remaining_time": "4:31:48"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 6.0956741200235315e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "15:25:16", "remaining_time": "4:31:49"} +{"current_steps": 5460, "total_steps": 7064, "loss": 0.7956, "reward": null, "learning_rate": 6.0956741200235315e-06, "epoch": 1.55, "percentage": 77.29, "elapsed_time": "15:25:17", "remaining_time": "4:31:49"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 6.023106166520104e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "15:26:59", "remaining_time": "4:30:07"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 6.023106166520104e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "15:30:50", "remaining_time": "4:31:15"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 6.023106166520104e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "15:26:58", "remaining_time": "4:30:07"} +{"current_steps": 5470, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 6.023106166520104e-06, "epoch": 1.55, "percentage": 77.43, "elapsed_time": "15:26:57", "remaining_time": "4:30:07"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 5.950913551224838e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "15:32:32", "remaining_time": "4:29:33"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 5.950913551224838e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "15:28:41", "remaining_time": "4:28:26"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 5.950913551224838e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "15:28:39", "remaining_time": "4:28:25"} +{"current_steps": 5480, "total_steps": 7064, "loss": 0.7849, "reward": null, "learning_rate": 5.950913551224838e-06, "epoch": 1.55, "percentage": 77.58, "elapsed_time": "15:28:40", "remaining_time": "4:28:25"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 5.879097702013495e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "15:30:18", "remaining_time": "4:26:43"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 5.879097702013495e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "15:34:12", "remaining_time": "4:27:50"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 5.879097702013495e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "15:30:19", "remaining_time": "4:26:43"} +{"current_steps": 5490, "total_steps": 7064, "loss": 0.7968, "reward": null, "learning_rate": 5.879097702013495e-06, "epoch": 1.55, "percentage": 77.72, "elapsed_time": "15:30:20", "remaining_time": "4:26:44"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 5.807660039309904e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "15:31:59", "remaining_time": "4:25:01"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 5.807660039309904e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "15:35:53", "remaining_time": "4:26:07"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 5.807660039309904e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "15:32:00", "remaining_time": "4:25:01"} +{"current_steps": 5500, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 5.807660039309904e-06, "epoch": 1.56, "percentage": 77.86, "elapsed_time": "15:32:01", "remaining_time": "4:25:02"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 5.736601976057848e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "15:37:35", "remaining_time": "4:24:25"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 5.736601976057848e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "15:33:44", "remaining_time": "4:23:20"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 5.736601976057848e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "15:33:43", "remaining_time": "4:23:20"} +{"current_steps": 5510, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 5.736601976057848e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "15:33:42", "remaining_time": "4:23:20"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 5.66592491769315e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "15:39:20", "remaining_time": "4:22:44"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 5.66592491769315e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "15:35:28", "remaining_time": "4:21:39"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 5.66592491769315e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "15:35:29", "remaining_time": "4:21:39"} +{"current_steps": 5520, "total_steps": 7064, "loss": 0.7792, "reward": null, "learning_rate": 5.66592491769315e-06, "epoch": 1.56, "percentage": 78.14, "elapsed_time": "15:35:27", "remaining_time": "4:21:39"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 5.595630262115825e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "15:37:08", "remaining_time": "4:19:57"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 5.595630262115825e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "15:41:00", "remaining_time": "4:21:01"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 5.595630262115825e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "15:37:07", "remaining_time": "4:19:57"} +{"current_steps": 5530, "total_steps": 7064, "loss": 0.7808, "reward": null, "learning_rate": 5.595630262115825e-06, "epoch": 1.57, "percentage": 78.28, "elapsed_time": "15:37:06", "remaining_time": "4:19:57"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7723, "reward": null, "learning_rate": 5.525719399662488e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "15:38:45", "remaining_time": "4:18:14"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7723, "reward": null, "learning_rate": 5.525719399662488e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "15:42:37", "remaining_time": "4:19:18"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7723, "reward": null, "learning_rate": 5.525719399662488e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "15:38:44", "remaining_time": "4:18:14"} +{"current_steps": 5540, "total_steps": 7064, "loss": 0.7723, "reward": null, "learning_rate": 5.525719399662488e-06, "epoch": 1.57, "percentage": 78.43, "elapsed_time": "15:38:43", "remaining_time": "4:18:14"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 5.456193713078797e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "15:40:29", "remaining_time": "4:16:33"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 5.456193713078797e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "15:40:28", "remaining_time": "4:16:33"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 5.456193713078797e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "15:40:27", "remaining_time": "4:16:33"} +{"current_steps": 5550, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 5.456193713078797e-06, "epoch": 1.57, "percentage": 78.57, "elapsed_time": "15:44:20", "remaining_time": "4:17:36"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.387054577492165e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "15:42:10", "remaining_time": "4:14:51"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.387054577492165e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "15:46:02", "remaining_time": "4:15:54"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.387054577492165e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "15:42:09", "remaining_time": "4:14:51"} +{"current_steps": 5560, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.387054577492165e-06, "epoch": 1.57, "percentage": 78.71, "elapsed_time": "15:42:08", "remaining_time": "4:14:51"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.318303360384508e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:43:52", "remaining_time": "4:13:10"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.318303360384508e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:43:51", "remaining_time": "4:13:09"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.318303360384508e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:47:43", "remaining_time": "4:14:12"} +{"current_steps": 5570, "total_steps": 7064, "loss": 0.7801, "reward": null, "learning_rate": 5.318303360384508e-06, "epoch": 1.58, "percentage": 78.85, "elapsed_time": "15:43:50", "remaining_time": "4:13:09"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 5.249941421565227e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:49:26", "remaining_time": "4:12:30"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 5.249941421565227e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:45:35", "remaining_time": "4:11:28"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 5.249941421565227e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:45:33", "remaining_time": "4:11:28"} +{"current_steps": 5580, "total_steps": 7064, "loss": 0.7733, "reward": null, "learning_rate": 5.249941421565227e-06, "epoch": 1.58, "percentage": 78.99, "elapsed_time": "15:45:34", "remaining_time": "4:11:28"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7891, "reward": null, "learning_rate": 5.181970113144296e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:47:20", "remaining_time": "4:09:47"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7891, "reward": null, "learning_rate": 5.181970113144296e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:47:18", "remaining_time": "4:09:47"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7891, "reward": null, "learning_rate": 5.181970113144296e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:47:19", "remaining_time": "4:09:47"} +{"current_steps": 5590, "total_steps": 7064, "loss": 0.7891, "reward": null, "learning_rate": 5.181970113144296e-06, "epoch": 1.58, "percentage": 79.13, "elapsed_time": "15:51:11", "remaining_time": "4:10:48"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 5.114390779505557e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:49:00", "remaining_time": "4:08:05"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 5.114390779505557e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:48:58", "remaining_time": "4:08:05"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 5.114390779505557e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:52:51", "remaining_time": "4:09:06"} +{"current_steps": 5600, "total_steps": 7064, "loss": 0.7912, "reward": null, "learning_rate": 5.114390779505557e-06, "epoch": 1.59, "percentage": 79.28, "elapsed_time": "15:48:58", "remaining_time": "4:08:05"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 5.047204757280072e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:50:37", "remaining_time": "4:06:22"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 5.047204757280072e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:50:39", "remaining_time": "4:06:23"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 5.047204757280072e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:50:38", "remaining_time": "4:06:23"} +{"current_steps": 5610, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 5.047204757280072e-06, "epoch": 1.59, "percentage": 79.42, "elapsed_time": "15:54:30", "remaining_time": "4:07:23"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 4.980413375319737e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:56:15", "remaining_time": "4:05:41"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 4.980413375319737e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:52:23", "remaining_time": "4:04:42"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 4.980413375319737e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:52:22", "remaining_time": "4:04:42"} +{"current_steps": 5620, "total_steps": 7064, "loss": 0.7922, "reward": null, "learning_rate": 4.980413375319737e-06, "epoch": 1.59, "percentage": 79.56, "elapsed_time": "15:52:21", "remaining_time": "4:04:42"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 4.914017954670961e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:54:05", "remaining_time": "4:03:00"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 4.914017954670961e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:57:56", "remaining_time": "4:03:59"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 4.914017954670961e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:54:04", "remaining_time": "4:03:00"} +{"current_steps": 5630, "total_steps": 7064, "loss": 0.79, "reward": null, "learning_rate": 4.914017954670961e-06, "epoch": 1.59, "percentage": 79.7, "elapsed_time": "15:54:03", "remaining_time": "4:03:00"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 4.8480198085485765e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:59:38", "remaining_time": "4:02:17"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 4.8480198085485765e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:55:46", "remaining_time": "4:01:19"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 4.8480198085485765e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:55:45", "remaining_time": "4:01:18"} +{"current_steps": 5640, "total_steps": 7064, "loss": 0.7844, "reward": null, "learning_rate": 4.8480198085485765e-06, "epoch": 1.6, "percentage": 79.84, "elapsed_time": "15:55:44", "remaining_time": "4:01:18"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 4.782420242309821e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "16:01:18", "remaining_time": "4:00:34"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 4.782420242309821e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "15:57:25", "remaining_time": "3:59:36"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 4.782420242309821e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "15:57:26", "remaining_time": "3:59:36"} +{"current_steps": 5650, "total_steps": 7064, "loss": 0.7855, "reward": null, "learning_rate": 4.782420242309821e-06, "epoch": 1.6, "percentage": 79.98, "elapsed_time": "15:57:24", "remaining_time": "3:59:36"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 4.717220553428559e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "15:59:05", "remaining_time": "3:57:54"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 4.717220553428559e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "15:59:04", "remaining_time": "3:57:54"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 4.717220553428559e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "15:59:03", "remaining_time": "3:57:54"} +{"current_steps": 5660, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 4.717220553428559e-06, "epoch": 1.6, "percentage": 80.12, "elapsed_time": "16:02:56", "remaining_time": "3:58:51"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 4.652422031469583e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "16:04:39", "remaining_time": "3:57:10"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 4.652422031469583e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "16:00:47", "remaining_time": "3:56:12"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 4.652422031469583e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "16:00:46", "remaining_time": "3:56:12"} +{"current_steps": 5670, "total_steps": 7064, "loss": 0.7864, "reward": null, "learning_rate": 4.652422031469583e-06, "epoch": 1.61, "percentage": 80.27, "elapsed_time": "16:00:48", "remaining_time": "3:56:13"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 4.58802595806315e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "16:02:30", "remaining_time": "3:54:31"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 4.58802595806315e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "16:06:22", "remaining_time": "3:55:28"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 4.58802595806315e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "16:02:29", "remaining_time": "3:54:31"} +{"current_steps": 5680, "total_steps": 7064, "loss": 0.7802, "reward": null, "learning_rate": 4.58802595806315e-06, "epoch": 1.61, "percentage": 80.41, "elapsed_time": "16:02:28", "remaining_time": "3:54:31"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 4.524033606879602e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "16:04:13", "remaining_time": "3:52:50"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 4.524033606879602e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "16:08:04", "remaining_time": "3:53:45"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 4.524033606879602e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "16:04:11", "remaining_time": "3:52:49"} +{"current_steps": 5690, "total_steps": 7064, "loss": 0.7776, "reward": null, "learning_rate": 4.524033606879602e-06, "epoch": 1.61, "percentage": 80.55, "elapsed_time": "16:04:11", "remaining_time": "3:52:49"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 4.460446243604169e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "16:05:52", "remaining_time": "3:51:07"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 4.460446243604169e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "16:09:45", "remaining_time": "3:52:03"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 4.460446243604169e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "16:05:54", "remaining_time": "3:51:08"} +{"current_steps": 5700, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 4.460446243604169e-06, "epoch": 1.61, "percentage": 80.69, "elapsed_time": "16:05:53", "remaining_time": "3:51:08"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 4.3972651259119706e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "16:07:30", "remaining_time": "3:49:25"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 4.3972651259119706e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "16:11:21", "remaining_time": "3:50:20"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 4.3972651259119706e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "16:07:28", "remaining_time": "3:49:24"} +{"current_steps": 5710, "total_steps": 7064, "loss": 0.7834, "reward": null, "learning_rate": 4.3972651259119706e-06, "epoch": 1.62, "percentage": 80.83, "elapsed_time": "16:07:29", "remaining_time": "3:49:25"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 4.3344915034431e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "16:09:12", "remaining_time": "3:47:43"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 4.3344915034431e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "16:09:10", "remaining_time": "3:47:43"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 4.3344915034431e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "16:09:11", "remaining_time": "3:47:43"} +{"current_steps": 5720, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 4.3344915034431e-06, "epoch": 1.62, "percentage": 80.97, "elapsed_time": "16:13:04", "remaining_time": "3:48:38"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 4.272126617777933e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "16:14:45", "remaining_time": "3:46:56"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 4.272126617777933e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "16:10:54", "remaining_time": "3:46:02"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 4.272126617777933e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "16:10:53", "remaining_time": "3:46:01"} +{"current_steps": 5730, "total_steps": 7064, "loss": 0.787, "reward": null, "learning_rate": 4.272126617777933e-06, "epoch": 1.62, "percentage": 81.12, "elapsed_time": "16:10:52", "remaining_time": "3:46:01"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 4.2101717024125576e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "16:16:30", "remaining_time": "3:45:14"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 4.2101717024125576e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "16:12:39", "remaining_time": "3:44:21"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 4.2101717024125576e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "16:12:38", "remaining_time": "3:44:21"} +{"current_steps": 5740, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 4.2101717024125576e-06, "epoch": 1.63, "percentage": 81.26, "elapsed_time": "16:12:37", "remaining_time": "3:44:20"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 4.148627982734404e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "16:18:09", "remaining_time": "3:43:31"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 4.148627982734404e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "16:14:18", "remaining_time": "3:42:39"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 4.148627982734404e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "16:14:17", "remaining_time": "3:42:38"} +{"current_steps": 5750, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 4.148627982734404e-06, "epoch": 1.63, "percentage": 81.4, "elapsed_time": "16:14:16", "remaining_time": "3:42:38"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 4.087496675997965e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "16:19:49", "remaining_time": "3:41:49"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 4.087496675997965e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "16:15:58", "remaining_time": "3:40:56"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 4.087496675997965e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "16:15:56", "remaining_time": "3:40:56"} +{"current_steps": 5760, "total_steps": 7064, "loss": 0.7917, "reward": null, "learning_rate": 4.087496675997965e-06, "epoch": 1.63, "percentage": 81.54, "elapsed_time": "16:15:57", "remaining_time": "3:40:56"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 4.026778991300762e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "16:17:39", "remaining_time": "3:39:15"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 4.026778991300762e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "16:17:40", "remaining_time": "3:39:15"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 4.026778991300762e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "16:21:32", "remaining_time": "3:40:07"} +{"current_steps": 5770, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 4.026778991300762e-06, "epoch": 1.63, "percentage": 81.68, "elapsed_time": "16:17:41", "remaining_time": "3:39:15"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7764, "reward": null, "learning_rate": 3.966476129559391e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "16:23:12", "remaining_time": "3:38:24"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7764, "reward": null, "learning_rate": 3.966476129559391e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "16:19:21", "remaining_time": "3:37:33"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7764, "reward": null, "learning_rate": 3.966476129559391e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "16:19:19", "remaining_time": "3:37:33"} +{"current_steps": 5780, "total_steps": 7064, "loss": 0.7764, "reward": null, "learning_rate": 3.966476129559391e-06, "epoch": 1.64, "percentage": 81.82, "elapsed_time": "16:19:20", "remaining_time": "3:37:33"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7718, "reward": null, "learning_rate": 3.90658928348582e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "16:21:02", "remaining_time": "3:35:51"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7718, "reward": null, "learning_rate": 3.90658928348582e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "16:21:00", "remaining_time": "3:35:51"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7718, "reward": null, "learning_rate": 3.90658928348582e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "16:21:01", "remaining_time": "3:35:51"} +{"current_steps": 5790, "total_steps": 7064, "loss": 0.7718, "reward": null, "learning_rate": 3.90658928348582e-06, "epoch": 1.64, "percentage": 81.96, "elapsed_time": "16:24:53", "remaining_time": "3:36:42"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 3.847119637563739e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "16:22:42", "remaining_time": "3:34:09"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 3.847119637563739e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "16:22:41", "remaining_time": "3:34:09"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 3.847119637563739e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "16:22:40", "remaining_time": "3:34:09"} +{"current_steps": 5800, "total_steps": 7064, "loss": 0.791, "reward": null, "learning_rate": 3.847119637563739e-06, "epoch": 1.64, "percentage": 82.11, "elapsed_time": "16:26:33", "remaining_time": "3:35:00"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 3.7880683680251855e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "16:24:24", "remaining_time": "3:32:28"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 3.7880683680251855e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "16:28:15", "remaining_time": "3:33:18"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 3.7880683680251855e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "16:24:22", "remaining_time": "3:32:27"} +{"current_steps": 5810, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 3.7880683680251855e-06, "epoch": 1.64, "percentage": 82.25, "elapsed_time": "16:24:23", "remaining_time": "3:32:27"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7621, "reward": null, "learning_rate": 3.7294366428272386e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "16:30:00", "remaining_time": "3:31:36"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7621, "reward": null, "learning_rate": 3.7294366428272386e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "16:26:09", "remaining_time": "3:30:47"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7621, "reward": null, "learning_rate": 3.7294366428272386e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "16:26:07", "remaining_time": "3:30:46"} +{"current_steps": 5820, "total_steps": 7064, "loss": 0.7621, "reward": null, "learning_rate": 3.7294366428272386e-06, "epoch": 1.65, "percentage": 82.39, "elapsed_time": "16:26:08", "remaining_time": "3:30:46"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 3.6712256216289624e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "16:27:51", "remaining_time": "3:29:05"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 3.6712256216289624e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "16:31:42", "remaining_time": "3:29:54"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 3.6712256216289624e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "16:27:50", "remaining_time": "3:29:05"} +{"current_steps": 5830, "total_steps": 7064, "loss": 0.7619, "reward": null, "learning_rate": 3.6712256216289624e-06, "epoch": 1.65, "percentage": 82.53, "elapsed_time": "16:27:49", "remaining_time": "3:29:05"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 3.613436455768418e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "16:33:23", "remaining_time": "3:28:12"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 3.613436455768418e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "16:29:31", "remaining_time": "3:27:23"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 3.613436455768418e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "16:29:30", "remaining_time": "3:27:23"} +{"current_steps": 5840, "total_steps": 7064, "loss": 0.782, "reward": null, "learning_rate": 3.613436455768418e-06, "epoch": 1.65, "percentage": 82.67, "elapsed_time": "16:29:29", "remaining_time": "3:27:23"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 3.5560702882399406e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "16:31:07", "remaining_time": "3:25:40"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 3.5560702882399406e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "16:31:09", "remaining_time": "3:25:41"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 3.5560702882399406e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "16:31:08", "remaining_time": "3:25:40"} +{"current_steps": 5850, "total_steps": 7064, "loss": 0.7853, "reward": null, "learning_rate": 3.5560702882399406e-06, "epoch": 1.66, "percentage": 82.81, "elapsed_time": "16:35:00", "remaining_time": "3:26:29"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 3.499128253671494e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "16:32:48", "remaining_time": "3:23:59"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 3.499128253671494e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "16:36:39", "remaining_time": "3:24:46"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 3.499128253671494e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "16:32:46", "remaining_time": "3:23:58"} +{"current_steps": 5860, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 3.499128253671494e-06, "epoch": 1.66, "percentage": 82.96, "elapsed_time": "16:32:47", "remaining_time": "3:23:58"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 3.4426114783022546e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "16:34:32", "remaining_time": "3:22:17"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 3.4426114783022546e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "16:34:31", "remaining_time": "3:22:17"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 3.4426114783022546e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "16:34:30", "remaining_time": "3:22:17"} +{"current_steps": 5870, "total_steps": 7064, "loss": 0.7939, "reward": null, "learning_rate": 3.4426114783022546e-06, "epoch": 1.66, "percentage": 83.1, "elapsed_time": "16:38:24", "remaining_time": "3:23:04"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 3.3865210799603253e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "16:40:07", "remaining_time": "3:21:23"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 3.3865210799603253e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "16:36:14", "remaining_time": "3:20:36"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 3.3865210799603253e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "16:36:15", "remaining_time": "3:20:36"} +{"current_steps": 5880, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 3.3865210799603253e-06, "epoch": 1.66, "percentage": 83.24, "elapsed_time": "16:36:16", "remaining_time": "3:20:36"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 3.3308581680406182e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "16:41:51", "remaining_time": "3:19:41"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 3.3308581680406182e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "16:37:57", "remaining_time": "3:18:54"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 3.3308581680406182e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "16:37:58", "remaining_time": "3:18:55"} +{"current_steps": 5890, "total_steps": 7064, "loss": 0.7951, "reward": null, "learning_rate": 3.3308581680406182e-06, "epoch": 1.67, "percentage": 83.38, "elapsed_time": "16:37:59", "remaining_time": "3:18:55"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 3.275623843482939e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "16:39:42", "remaining_time": "3:17:13"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 3.275623843482939e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "16:39:41", "remaining_time": "3:17:13"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 3.275623843482939e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "16:39:40", "remaining_time": "3:17:13"} +{"current_steps": 5900, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 3.275623843482939e-06, "epoch": 1.67, "percentage": 83.52, "elapsed_time": "16:43:33", "remaining_time": "3:17:59"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 3.220819198750172e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "16:41:24", "remaining_time": "3:15:32"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 3.220819198750172e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "16:45:15", "remaining_time": "3:16:17"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 3.220819198750172e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "16:41:23", "remaining_time": "3:15:32"} +{"current_steps": 5910, "total_steps": 7064, "loss": 0.7788, "reward": null, "learning_rate": 3.220819198750172e-06, "epoch": 1.67, "percentage": 83.66, "elapsed_time": "16:41:22", "remaining_time": "3:15:31"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8137, "reward": null, "learning_rate": 3.166445317806721e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "16:47:02", "remaining_time": "3:14:36"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8137, "reward": null, "learning_rate": 3.166445317806721e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "16:43:10", "remaining_time": "3:13:51"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8137, "reward": null, "learning_rate": 3.166445317806721e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "16:43:08", "remaining_time": "3:13:51"} +{"current_steps": 5920, "total_steps": 7064, "loss": 0.8137, "reward": null, "learning_rate": 3.166445317806721e-06, "epoch": 1.68, "percentage": 83.81, "elapsed_time": "16:43:09", "remaining_time": "3:13:51"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 3.1125032760970203e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "16:48:42", "remaining_time": "3:12:53"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 3.1125032760970203e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "16:44:49", "remaining_time": "3:12:09"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 3.1125032760970203e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "16:44:51", "remaining_time": "3:12:09"} +{"current_steps": 5930, "total_steps": 7064, "loss": 0.7665, "reward": null, "learning_rate": 3.1125032760970203e-06, "epoch": 1.68, "percentage": 83.95, "elapsed_time": "16:44:50", "remaining_time": "3:12:09"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 3.0589941405243043e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "16:46:33", "remaining_time": "3:10:27"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 3.0589941405243043e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "16:46:32", "remaining_time": "3:10:27"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 3.0589941405243043e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "16:46:31", "remaining_time": "3:10:27"} +{"current_steps": 5940, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 3.0589941405243043e-06, "epoch": 1.68, "percentage": 84.09, "elapsed_time": "16:50:24", "remaining_time": "3:11:11"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.0059189694294774e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:48:13", "remaining_time": "3:08:45"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.0059189694294774e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:52:04", "remaining_time": "3:09:29"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.0059189694294774e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:48:11", "remaining_time": "3:08:45"} +{"current_steps": 5950, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.0059189694294774e-06, "epoch": 1.68, "percentage": 84.23, "elapsed_time": "16:48:11", "remaining_time": "3:08:45"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 2.953278812570201e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:49:56", "remaining_time": "3:07:04"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 2.953278812570201e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:53:47", "remaining_time": "3:07:47"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 2.953278812570201e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:49:55", "remaining_time": "3:07:04"} +{"current_steps": 5960, "total_steps": 7064, "loss": 0.7736, "reward": null, "learning_rate": 2.953278812570201e-06, "epoch": 1.69, "percentage": 84.37, "elapsed_time": "16:49:54", "remaining_time": "3:07:04"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 2.9010747111001103e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:51:40", "remaining_time": "3:05:23"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 2.9010747111001103e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:51:39", "remaining_time": "3:05:23"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 2.9010747111001103e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:51:38", "remaining_time": "3:05:22"} +{"current_steps": 5970, "total_steps": 7064, "loss": 0.7759, "reward": null, "learning_rate": 2.9010747111001103e-06, "epoch": 1.69, "percentage": 84.51, "elapsed_time": "16:55:31", "remaining_time": "3:06:05"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 2.849307697548251e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:53:22", "remaining_time": "3:03:41"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 2.849307697548251e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:53:21", "remaining_time": "3:03:41"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 2.849307697548251e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:53:20", "remaining_time": "3:03:41"} +{"current_steps": 5980, "total_steps": 7064, "loss": 0.7946, "reward": null, "learning_rate": 2.849307697548251e-06, "epoch": 1.69, "percentage": 84.65, "elapsed_time": "16:57:13", "remaining_time": "3:04:23"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.7979787957986225e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:54:59", "remaining_time": "3:01:59"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.7979787957986225e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:58:53", "remaining_time": "3:02:41"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.7979787957986225e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:55:01", "remaining_time": "3:01:59"} +{"current_steps": 5990, "total_steps": 7064, "loss": 0.7938, "reward": null, "learning_rate": 2.7979787957986225e-06, "epoch": 1.7, "percentage": 84.8, "elapsed_time": "16:55:00", "remaining_time": "3:01:59"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 2.7470890210699596e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "16:56:48", "remaining_time": "3:00:18"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 2.7470890210699596e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "16:56:46", "remaining_time": "3:00:18"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 2.7470890210699596e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "16:56:47", "remaining_time": "3:00:18"} +{"current_steps": 6000, "total_steps": 7064, "loss": 0.7818, "reward": null, "learning_rate": 2.7470890210699596e-06, "epoch": 1.7, "percentage": 84.94, "elapsed_time": "17:00:40", "remaining_time": "3:00:59"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 2.6966393798956242e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "16:58:29", "remaining_time": "2:58:36"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 2.6966393798956242e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "16:58:28", "remaining_time": "2:58:36"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 2.6966393798956242e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "17:02:21", "remaining_time": "2:59:17"} +{"current_steps": 6010, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 2.6966393798956242e-06, "epoch": 1.7, "percentage": 85.08, "elapsed_time": "16:58:30", "remaining_time": "2:58:37"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 2.6466308701037253e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "17:04:05", "remaining_time": "2:57:35"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 2.6466308701037253e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "17:00:14", "remaining_time": "2:56:55"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 2.6466308701037253e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "17:00:12", "remaining_time": "2:56:55"} +{"current_steps": 6020, "total_steps": 7064, "loss": 0.7779, "reward": null, "learning_rate": 2.6466308701037253e-06, "epoch": 1.7, "percentage": 85.22, "elapsed_time": "17:00:12", "remaining_time": "2:56:55"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.597064480797351e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "17:01:55", "remaining_time": "2:55:14"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.597064480797351e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "17:01:53", "remaining_time": "2:55:13"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.597064480797351e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "17:01:54", "remaining_time": "2:55:14"} +{"current_steps": 6030, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 2.597064480797351e-06, "epoch": 1.71, "percentage": 85.36, "elapsed_time": "17:05:47", "remaining_time": "2:55:53"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 2.547941192335035e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "17:03:38", "remaining_time": "2:53:32"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 2.547941192335035e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "17:07:29", "remaining_time": "2:54:11"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 2.547941192335035e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "17:03:36", "remaining_time": "2:53:32"} +{"current_steps": 6040, "total_steps": 7064, "loss": 0.7881, "reward": null, "learning_rate": 2.547941192335035e-06, "epoch": 1.71, "percentage": 85.5, "elapsed_time": "17:03:37", "remaining_time": "2:53:32"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 2.4992619763113427e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "17:05:16", "remaining_time": "2:51:50"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 2.4992619763113427e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "17:05:14", "remaining_time": "2:51:50"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 2.4992619763113427e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "17:05:15", "remaining_time": "2:51:50"} +{"current_steps": 6050, "total_steps": 7064, "loss": 0.7772, "reward": null, "learning_rate": 2.4992619763113427e-06, "epoch": 1.71, "percentage": 85.65, "elapsed_time": "17:09:07", "remaining_time": "2:52:29"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 2.4510277955376885e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "17:06:56", "remaining_time": "2:50:08"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 2.4510277955376885e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "17:06:54", "remaining_time": "2:50:08"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 2.4510277955376885e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "17:06:55", "remaining_time": "2:50:08"} +{"current_steps": 6060, "total_steps": 7064, "loss": 0.7812, "reward": null, "learning_rate": 2.4510277955376885e-06, "epoch": 1.72, "percentage": 85.79, "elapsed_time": "17:10:47", "remaining_time": "2:50:46"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 2.403239604023244e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "17:08:39", "remaining_time": "2:48:26"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 2.403239604023244e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "17:12:30", "remaining_time": "2:49:04"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 2.403239604023244e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "17:08:38", "remaining_time": "2:48:26"} +{"current_steps": 6070, "total_steps": 7064, "loss": 0.7753, "reward": null, "learning_rate": 2.403239604023244e-06, "epoch": 1.72, "percentage": 85.93, "elapsed_time": "17:08:37", "remaining_time": "2:48:26"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "17:10:20", "remaining_time": "2:46:45"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "17:10:18", "remaining_time": "2:46:44"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "17:14:11", "remaining_time": "2:47:22"} +{"current_steps": 6080, "total_steps": 7064, "loss": 0.7778, "reward": null, "learning_rate": 2.360612333857401e-06, "epoch": 1.72, "percentage": 86.07, "elapsed_time": "17:10:19", "remaining_time": "2:46:44"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "17:15:49", "remaining_time": "2:45:39"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "17:11:58", "remaining_time": "2:45:02"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "17:11:57", "remaining_time": "2:45:02"} +{"current_steps": 6090, "total_steps": 7064, "loss": 0.7883, "reward": null, "learning_rate": 2.31367411862298e-06, "epoch": 1.72, "percentage": 86.21, "elapsed_time": "17:11:56", "remaining_time": "2:45:02"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "17:17:33", "remaining_time": "2:43:58"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "17:13:41", "remaining_time": "2:43:21"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "17:13:40", "remaining_time": "2:43:21"} +{"current_steps": 6100, "total_steps": 7064, "loss": 0.7885, "reward": null, "learning_rate": 2.2671846093243493e-06, "epoch": 1.73, "percentage": 86.35, "elapsed_time": "17:13:39", "remaining_time": "2:43:21"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "17:15:27", "remaining_time": "2:41:40"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "17:15:25", "remaining_time": "2:41:40"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "17:15:26", "remaining_time": "2:41:40"} +{"current_steps": 6110, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 2.221144725463359e-06, "epoch": 1.73, "percentage": 86.49, "elapsed_time": "17:19:18", "remaining_time": "2:42:16"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.8012, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "17:21:02", "remaining_time": "2:40:34"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.8012, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "17:17:10", "remaining_time": "2:39:59"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.8012, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "17:17:08", "remaining_time": "2:39:58"} +{"current_steps": 6120, "total_steps": 7064, "loss": 0.8012, "reward": null, "learning_rate": 2.1755553776488745e-06, "epoch": 1.73, "percentage": 86.64, "elapsed_time": "17:17:09", "remaining_time": "2:39:58"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "17:18:53", "remaining_time": "2:38:17"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "17:18:51", "remaining_time": "2:38:17"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "17:18:52", "remaining_time": "2:38:17"} +{"current_steps": 6130, "total_steps": 7064, "loss": 0.7967, "reward": null, "learning_rate": 2.130417467578724e-06, "epoch": 1.74, "percentage": 86.78, "elapsed_time": "17:22:44", "remaining_time": "2:38:52"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "17:20:33", "remaining_time": "2:36:35"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "17:20:31", "remaining_time": "2:36:35"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "17:20:32", "remaining_time": "2:36:35"} +{"current_steps": 6140, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.0857318880218995e-06, "epoch": 1.74, "percentage": 86.92, "elapsed_time": "17:24:24", "remaining_time": "2:37:10"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "17:22:13", "remaining_time": "2:34:53"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "17:26:04", "remaining_time": "2:35:27"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "17:22:11", "remaining_time": "2:34:53"} +{"current_steps": 6150, "total_steps": 7064, "loss": 0.7657, "reward": null, "learning_rate": 2.0414995228008743e-06, "epoch": 1.74, "percentage": 87.06, "elapsed_time": "17:22:12", "remaining_time": "2:34:53"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "17:27:45", "remaining_time": "2:33:45"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "17:23:54", "remaining_time": "2:33:11"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "17:23:53", "remaining_time": "2:33:11"} +{"current_steps": 6160, "total_steps": 7064, "loss": 0.7655, "reward": null, "learning_rate": 1.997721246774145e-06, "epoch": 1.74, "percentage": 87.2, "elapsed_time": "17:23:52", "remaining_time": "2:33:11"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7713, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "17:25:35", "remaining_time": "2:31:30"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7713, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "17:29:27", "remaining_time": "2:32:03"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7713, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "17:25:34", "remaining_time": "2:31:29"} +{"current_steps": 6170, "total_steps": 7064, "loss": 0.7713, "reward": null, "learning_rate": 1.9543979258189126e-06, "epoch": 1.75, "percentage": 87.34, "elapsed_time": "17:25:33", "remaining_time": "2:31:29"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "17:31:09", "remaining_time": "2:30:21"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "17:27:16", "remaining_time": "2:29:48"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "17:27:17", "remaining_time": "2:29:48"} +{"current_steps": 6180, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 1.911530416813953e-06, "epoch": 1.75, "percentage": 87.49, "elapsed_time": "17:27:18", "remaining_time": "2:29:48"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "17:28:56", "remaining_time": "2:28:06"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "17:32:49", "remaining_time": "2:28:39"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "17:28:57", "remaining_time": "2:28:06"} +{"current_steps": 6190, "total_steps": 7064, "loss": 0.7983, "reward": null, "learning_rate": 1.869119567622679e-06, "epoch": 1.75, "percentage": 87.63, "elapsed_time": "17:28:58", "remaining_time": "2:28:06"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "17:34:34", "remaining_time": "2:26:57"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "17:30:41", "remaining_time": "2:26:25"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "17:30:42", "remaining_time": "2:26:25"} +{"current_steps": 6200, "total_steps": 7064, "loss": 0.8057, "reward": null, "learning_rate": 1.8271662170763787e-06, "epoch": 1.76, "percentage": 87.77, "elapsed_time": "17:30:43", "remaining_time": "2:26:25"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "17:32:24", "remaining_time": "2:24:43"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "17:32:22", "remaining_time": "2:24:43"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "17:32:23", "remaining_time": "2:24:43"} +{"current_steps": 6210, "total_steps": 7064, "loss": 0.7798, "reward": null, "learning_rate": 1.7856711949575972e-06, "epoch": 1.76, "percentage": 87.91, "elapsed_time": "17:36:15", "remaining_time": "2:25:15"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "17:34:09", "remaining_time": "2:23:02"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "17:38:00", "remaining_time": "2:23:33"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "17:34:07", "remaining_time": "2:23:02"} +{"current_steps": 6220, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.7446353219837592e-06, "epoch": 1.76, "percentage": 88.05, "elapsed_time": "17:34:08", "remaining_time": "2:23:02"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "17:35:52", "remaining_time": "2:21:20"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "17:35:50", "remaining_time": "2:21:20"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "17:39:43", "remaining_time": "2:21:51"} +{"current_steps": 6230, "total_steps": 7064, "loss": 0.7907, "reward": null, "learning_rate": 1.704059409790898e-06, "epoch": 1.76, "percentage": 88.19, "elapsed_time": "17:35:51", "remaining_time": "2:21:20"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "17:37:33", "remaining_time": "2:19:39"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "17:37:31", "remaining_time": "2:19:38"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "17:37:31", "remaining_time": "2:19:38"} +{"current_steps": 6240, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 1.6639442609176409e-06, "epoch": 1.77, "percentage": 88.34, "elapsed_time": "17:41:24", "remaining_time": "2:20:09"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "17:39:17", "remaining_time": "2:17:57"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "17:43:08", "remaining_time": "2:18:27"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "17:39:16", "remaining_time": "2:17:57"} +{"current_steps": 6250, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 1.6242906687893077e-06, "epoch": 1.77, "percentage": 88.48, "elapsed_time": "17:39:15", "remaining_time": "2:17:57"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "17:41:00", "remaining_time": "2:16:16"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "17:44:51", "remaining_time": "2:16:45"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "17:40:58", "remaining_time": "2:16:15"} +{"current_steps": 6260, "total_steps": 7064, "loss": 0.7988, "reward": null, "learning_rate": 1.5850994177022265e-06, "epoch": 1.77, "percentage": 88.62, "elapsed_time": "17:40:59", "remaining_time": "2:16:16"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "17:46:32", "remaining_time": "2:15:03"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "17:42:38", "remaining_time": "2:14:34"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "17:42:39", "remaining_time": "2:14:34"} +{"current_steps": 6270, "total_steps": 7064, "loss": 0.7741, "reward": null, "learning_rate": 1.546371282808226e-06, "epoch": 1.78, "percentage": 88.76, "elapsed_time": "17:42:40", "remaining_time": "2:14:34"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7944, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "17:44:24", "remaining_time": "2:12:52"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7944, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "17:44:23", "remaining_time": "2:12:52"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7944, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "17:48:15", "remaining_time": "2:13:21"} +{"current_steps": 6280, "total_steps": 7064, "loss": 0.7944, "reward": null, "learning_rate": 1.508107030099304e-06, "epoch": 1.78, "percentage": 88.9, "elapsed_time": "17:44:22", "remaining_time": "2:12:52"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "17:46:05", "remaining_time": "2:11:11"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "17:49:56", "remaining_time": "2:11:39"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "17:46:04", "remaining_time": "2:11:10"} +{"current_steps": 6290, "total_steps": 7064, "loss": 0.7845, "reward": null, "learning_rate": 1.4703074163924718e-06, "epoch": 1.78, "percentage": 89.04, "elapsed_time": "17:46:03", "remaining_time": "2:11:10"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "17:47:45", "remaining_time": "2:09:29"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "17:51:36", "remaining_time": "2:09:57"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "17:47:43", "remaining_time": "2:09:28"} +{"current_steps": 6300, "total_steps": 7064, "loss": 0.7832, "reward": null, "learning_rate": 1.4329731893147792e-06, "epoch": 1.78, "percentage": 89.18, "elapsed_time": "17:47:44", "remaining_time": "2:09:29"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "17:49:26", "remaining_time": "2:07:47"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "17:49:28", "remaining_time": "2:07:47"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "17:49:27", "remaining_time": "2:07:47"} +{"current_steps": 6310, "total_steps": 7064, "loss": 0.7933, "reward": null, "learning_rate": 1.396105087288549e-06, "epoch": 1.79, "percentage": 89.33, "elapsed_time": "17:53:19", "remaining_time": "2:08:15"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7803, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:55:00", "remaining_time": "2:06:33"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7803, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:51:09", "remaining_time": "2:06:05"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7803, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:51:08", "remaining_time": "2:06:05"} +{"current_steps": 6320, "total_steps": 7064, "loss": 0.7803, "reward": null, "learning_rate": 1.3597038395167516e-06, "epoch": 1.79, "percentage": 89.47, "elapsed_time": "17:51:07", "remaining_time": "2:06:05"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:52:47", "remaining_time": "2:04:23"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:56:38", "remaining_time": "2:04:50"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:52:45", "remaining_time": "2:04:23"} +{"current_steps": 6330, "total_steps": 7064, "loss": 0.7794, "reward": null, "learning_rate": 1.3237701659685854e-06, "epoch": 1.79, "percentage": 89.61, "elapsed_time": "17:52:46", "remaining_time": "2:04:23"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7715, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:58:17", "remaining_time": "2:03:08"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7715, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:54:25", "remaining_time": "2:02:41"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7715, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:54:23", "remaining_time": "2:02:41"} +{"current_steps": 6340, "total_steps": 7064, "loss": 0.7715, "reward": null, "learning_rate": 1.28830477736524e-06, "epoch": 1.8, "percentage": 89.75, "elapsed_time": "17:54:24", "remaining_time": "2:02:41"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "18:00:01", "remaining_time": "2:01:26"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "17:56:08", "remaining_time": "2:01:00"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "17:56:09", "remaining_time": "2:01:00"} +{"current_steps": 6350, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 1.253308375165857e-06, "epoch": 1.8, "percentage": 89.89, "elapsed_time": "17:56:10", "remaining_time": "2:01:00"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "17:57:52", "remaining_time": "1:59:18"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "18:01:43", "remaining_time": "1:59:44"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "17:57:51", "remaining_time": "1:59:18"} +{"current_steps": 6360, "total_steps": 7064, "loss": 0.7829, "reward": null, "learning_rate": 1.2187816515536105e-06, "epoch": 1.8, "percentage": 90.03, "elapsed_time": "17:57:50", "remaining_time": "1:59:18"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "18:03:26", "remaining_time": "1:58:02"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "17:59:34", "remaining_time": "1:57:37"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "17:59:33", "remaining_time": "1:57:36"} +{"current_steps": 6370, "total_steps": 7064, "loss": 0.7932, "reward": null, "learning_rate": 1.184725289422073e-06, "epoch": 1.8, "percentage": 90.18, "elapsed_time": "17:59:35", "remaining_time": "1:57:37"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7838, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "18:05:07", "remaining_time": "1:56:20"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7838, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "18:01:15", "remaining_time": "1:55:55"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7838, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "18:01:14", "remaining_time": "1:55:55"} +{"current_steps": 6380, "total_steps": 7064, "loss": 0.7838, "reward": null, "learning_rate": 1.151139962361658e-06, "epoch": 1.81, "percentage": 90.32, "elapsed_time": "18:01:13", "remaining_time": "1:55:55"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "18:03:02", "remaining_time": "1:54:14"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "18:06:54", "remaining_time": "1:54:38"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "18:03:01", "remaining_time": "1:54:14"} +{"current_steps": 6390, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.1180263346463327e-06, "epoch": 1.81, "percentage": 90.46, "elapsed_time": "18:03:00", "remaining_time": "1:54:14"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7757, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "18:04:46", "remaining_time": "1:52:32"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7757, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "18:08:38", "remaining_time": "1:52:56"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7757, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "18:04:44", "remaining_time": "1:52:32"} +{"current_steps": 6400, "total_steps": 7064, "loss": 0.7757, "reward": null, "learning_rate": 1.0853850612204646e-06, "epoch": 1.81, "percentage": 90.6, "elapsed_time": "18:04:45", "remaining_time": "1:52:32"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "18:10:18", "remaining_time": "1:51:14"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "18:06:27", "remaining_time": "1:50:50"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "18:06:26", "remaining_time": "1:50:50"} +{"current_steps": 6410, "total_steps": 7064, "loss": 0.779, "reward": null, "learning_rate": 1.053216787685865e-06, "epoch": 1.81, "percentage": 90.74, "elapsed_time": "18:06:25", "remaining_time": "1:50:50"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "18:08:14", "remaining_time": "1:49:09"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "18:12:05", "remaining_time": "1:49:32"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "18:08:12", "remaining_time": "1:49:09"} +{"current_steps": 6420, "total_steps": 7064, "loss": 0.7789, "reward": null, "learning_rate": 1.0215221502890254e-06, "epoch": 1.82, "percentage": 90.88, "elapsed_time": "18:08:13", "remaining_time": "1:49:09"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "18:09:52", "remaining_time": "1:47:27"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "18:13:44", "remaining_time": "1:47:50"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "18:09:51", "remaining_time": "1:47:27"} +{"current_steps": 6430, "total_steps": 7064, "loss": 0.7738, "reward": null, "learning_rate": 9.903017759085365e-07, "epoch": 1.82, "percentage": 91.02, "elapsed_time": "18:09:50", "remaining_time": "1:47:27"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "18:11:34", "remaining_time": "1:45:46"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "18:11:32", "remaining_time": "1:45:45"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "18:11:32", "remaining_time": "1:45:45"} +{"current_steps": 6440, "total_steps": 7064, "loss": 0.7873, "reward": null, "learning_rate": 9.595562820426758e-07, "epoch": 1.82, "percentage": 91.17, "elapsed_time": "18:15:25", "remaining_time": "1:46:08"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "18:13:19", "remaining_time": "1:44:04"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "18:17:11", "remaining_time": "1:44:26"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "18:13:17", "remaining_time": "1:44:04"} +{"current_steps": 6450, "total_steps": 7064, "loss": 0.7923, "reward": null, "learning_rate": 9.292862767972199e-07, "epoch": 1.83, "percentage": 91.31, "elapsed_time": "18:13:18", "remaining_time": "1:44:04"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "18:15:00", "remaining_time": "1:42:22"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "18:18:51", "remaining_time": "1:42:44"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "18:14:58", "remaining_time": "1:42:22"} +{"current_steps": 6460, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 8.994923588733856e-07, "epoch": 1.83, "percentage": 91.45, "elapsed_time": "18:14:59", "remaining_time": "1:42:22"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "18:16:39", "remaining_time": "1:40:40"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "18:20:32", "remaining_time": "1:41:02"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "18:16:40", "remaining_time": "1:40:41"} +{"current_steps": 6470, "total_steps": 7064, "loss": 0.7749, "reward": null, "learning_rate": 8.701751175560102e-07, "epoch": 1.83, "percentage": 91.59, "elapsed_time": "18:16:41", "remaining_time": "1:40:41"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "18:18:25", "remaining_time": "1:38:59"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "18:22:17", "remaining_time": "1:39:20"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "18:18:24", "remaining_time": "1:38:59"} +{"current_steps": 6480, "total_steps": 7064, "loss": 0.7706, "reward": null, "learning_rate": 8.41335132701887e-07, "epoch": 1.83, "percentage": 91.73, "elapsed_time": "18:18:23", "remaining_time": "1:38:59"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "18:20:04", "remaining_time": "1:37:17"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "18:23:56", "remaining_time": "1:37:38"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "18:20:02", "remaining_time": "1:37:17"} +{"current_steps": 6490, "total_steps": 7064, "loss": 0.7896, "reward": null, "learning_rate": 8.129729747283016e-07, "epoch": 1.84, "percentage": 91.87, "elapsed_time": "18:20:03", "remaining_time": "1:37:17"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "18:21:49", "remaining_time": "1:35:36"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "18:25:40", "remaining_time": "1:35:56"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "18:21:48", "remaining_time": "1:35:36"} +{"current_steps": 6500, "total_steps": 7064, "loss": 0.7918, "reward": null, "learning_rate": 7.85089204601741e-07, "epoch": 1.84, "percentage": 92.02, "elapsed_time": "18:21:47", "remaining_time": "1:35:36"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "18:23:31", "remaining_time": "1:33:54"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "18:27:22", "remaining_time": "1:34:14"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "18:23:29", "remaining_time": "1:33:54"} +{"current_steps": 6510, "total_steps": 7064, "loss": 0.7875, "reward": null, "learning_rate": 7.576843738268113e-07, "epoch": 1.84, "percentage": 92.16, "elapsed_time": "18:23:30", "remaining_time": "1:33:54"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "18:29:04", "remaining_time": "1:32:32"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "18:25:13", "remaining_time": "1:32:12"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "18:25:11", "remaining_time": "1:32:12"} +{"current_steps": 6520, "total_steps": 7064, "loss": 0.7871, "reward": null, "learning_rate": 7.307590244353263e-07, "epoch": 1.85, "percentage": 92.3, "elapsed_time": "18:25:12", "remaining_time": "1:32:12"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "18:26:51", "remaining_time": "1:30:30"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "18:30:42", "remaining_time": "1:30:49"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "18:26:49", "remaining_time": "1:30:30"} +{"current_steps": 6530, "total_steps": 7064, "loss": 0.7734, "reward": null, "learning_rate": 7.043136889755691e-07, "epoch": 1.85, "percentage": 92.44, "elapsed_time": "18:26:50", "remaining_time": "1:30:30"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "18:28:33", "remaining_time": "1:28:49"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "18:32:24", "remaining_time": "1:29:07"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "18:28:32", "remaining_time": "1:28:49"} +{"current_steps": 6540, "total_steps": 7064, "loss": 0.7856, "reward": null, "learning_rate": 6.783488905017871e-07, "epoch": 1.85, "percentage": 92.58, "elapsed_time": "18:28:31", "remaining_time": "1:28:49"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7964, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "18:30:15", "remaining_time": "1:27:07"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7964, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "18:34:06", "remaining_time": "1:27:25"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7964, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "18:30:14", "remaining_time": "1:27:07"} +{"current_steps": 6550, "total_steps": 7064, "loss": 0.7964, "reward": null, "learning_rate": 6.528651425638272e-07, "epoch": 1.85, "percentage": 92.72, "elapsed_time": "18:30:13", "remaining_time": "1:27:07"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "18:35:47", "remaining_time": "1:25:43"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "18:31:53", "remaining_time": "1:25:25"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "18:31:54", "remaining_time": "1:25:25"} +{"current_steps": 6560, "total_steps": 7064, "loss": 0.778, "reward": null, "learning_rate": 6.278629491969862e-07, "epoch": 1.86, "percentage": 92.87, "elapsed_time": "18:31:55", "remaining_time": "1:25:25"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7914, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "18:33:38", "remaining_time": "1:23:44"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7914, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "18:33:37", "remaining_time": "1:23:43"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7914, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "18:33:36", "remaining_time": "1:23:43"} +{"current_steps": 6570, "total_steps": 7064, "loss": 0.7914, "reward": null, "learning_rate": 6.033428049120326e-07, "epoch": 1.86, "percentage": 93.01, "elapsed_time": "18:37:29", "remaining_time": "1:24:01"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7691, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "18:35:20", "remaining_time": "1:22:02"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7691, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "18:35:18", "remaining_time": "1:22:02"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7691, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "18:35:19", "remaining_time": "1:22:02"} +{"current_steps": 6580, "total_steps": 7064, "loss": 0.7691, "reward": null, "learning_rate": 5.793051946854422e-07, "epoch": 1.86, "percentage": 93.15, "elapsed_time": "18:39:11", "remaining_time": "1:22:19"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "18:37:01", "remaining_time": "1:20:20"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "18:37:00", "remaining_time": "1:20:20"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "18:40:52", "remaining_time": "1:20:37"} +{"current_steps": 6590, "total_steps": 7064, "loss": 0.7893, "reward": null, "learning_rate": 5.557505939497915e-07, "epoch": 1.87, "percentage": 93.29, "elapsed_time": "18:36:59", "remaining_time": "1:20:20"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "18:38:45", "remaining_time": "1:18:39"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "18:38:43", "remaining_time": "1:18:38"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "18:38:44", "remaining_time": "1:18:39"} +{"current_steps": 6600, "total_steps": 7064, "loss": 0.7833, "reward": null, "learning_rate": 5.326794685843655e-07, "epoch": 1.87, "percentage": 93.43, "elapsed_time": "18:42:36", "remaining_time": "1:18:55"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "18:40:23", "remaining_time": "1:16:57"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "18:40:21", "remaining_time": "1:16:56"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "18:40:21", "remaining_time": "1:16:57"} +{"current_steps": 6610, "total_steps": 7064, "loss": 0.7903, "reward": null, "learning_rate": 5.100922749059239e-07, "epoch": 1.87, "percentage": 93.57, "elapsed_time": "18:44:14", "remaining_time": "1:17:13"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7683, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "18:42:06", "remaining_time": "1:15:15"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7683, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "18:45:57", "remaining_time": "1:15:31"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7683, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "18:42:05", "remaining_time": "1:15:15"} +{"current_steps": 6620, "total_steps": 7064, "loss": 0.7683, "reward": null, "learning_rate": 4.879894596597018e-07, "epoch": 1.87, "percentage": 93.71, "elapsed_time": "18:42:04", "remaining_time": "1:15:15"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7717, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "18:43:47", "remaining_time": "1:13:33"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7717, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "18:47:39", "remaining_time": "1:13:48"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7717, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "18:43:46", "remaining_time": "1:13:33"} +{"current_steps": 6630, "total_steps": 7064, "loss": 0.7717, "reward": null, "learning_rate": 4.663714600105534e-07, "epoch": 1.88, "percentage": 93.86, "elapsed_time": "18:43:45", "remaining_time": "1:13:33"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "18:45:29", "remaining_time": "1:11:52"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "18:45:27", "remaining_time": "1:11:52"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "18:45:28", "remaining_time": "1:11:52"} +{"current_steps": 6640, "total_steps": 7064, "loss": 0.7876, "reward": null, "learning_rate": 4.452387035343203e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "18:49:21", "remaining_time": "1:12:06"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "18:47:08", "remaining_time": "1:10:10"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "18:51:00", "remaining_time": "1:10:24"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "18:47:07", "remaining_time": "1:10:10"} +{"current_steps": 6650, "total_steps": 7064, "loss": 0.7888, "reward": null, "learning_rate": 4.2459160820935153e-07, "epoch": 1.88, "percentage": 94.14, "elapsed_time": "18:47:06", "remaining_time": "1:10:10"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "18:48:47", "remaining_time": "1:08:28"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "18:48:46", "remaining_time": "1:08:28"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "18:48:45", "remaining_time": "1:08:28"} +{"current_steps": 6660, "total_steps": 7064, "loss": 0.7729, "reward": null, "learning_rate": 4.044305824082717e-07, "epoch": 1.89, "percentage": 94.28, "elapsed_time": "18:52:38", "remaining_time": "1:08:42"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "18:54:19", "remaining_time": "1:07:00"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "18:50:26", "remaining_time": "1:06:46"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "18:50:27", "remaining_time": "1:06:46"} +{"current_steps": 6670, "total_steps": 7064, "loss": 0.7824, "reward": null, "learning_rate": 3.84756024889868e-07, "epoch": 1.89, "percentage": 94.42, "elapsed_time": "18:50:28", "remaining_time": "1:06:46"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.7662, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "18:56:04", "remaining_time": "1:05:18"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.7662, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "18:52:11", "remaining_time": "1:05:05"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.7662, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "18:52:11", "remaining_time": "1:05:05"} +{"current_steps": 6680, "total_steps": 7064, "loss": 0.7662, "reward": null, "learning_rate": 3.6556832479123504e-07, "epoch": 1.89, "percentage": 94.56, "elapsed_time": "18:52:13", "remaining_time": "1:05:05"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:53:55", "remaining_time": "1:03:23"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:53:53", "remaining_time": "1:03:23"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:53:54", "remaining_time": "1:03:23"} +{"current_steps": 6690, "total_steps": 7064, "loss": 0.7981, "reward": null, "learning_rate": 3.468678616200427e-07, "epoch": 1.89, "percentage": 94.71, "elapsed_time": "18:57:46", "remaining_time": "1:03:36"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.7806, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:55:37", "remaining_time": "1:01:41"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.7806, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:59:28", "remaining_time": "1:01:54"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.7806, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:55:36", "remaining_time": "1:01:41"} +{"current_steps": 6700, "total_steps": 7064, "loss": 0.7806, "reward": null, "learning_rate": 3.2865500524707217e-07, "epoch": 1.9, "percentage": 94.85, "elapsed_time": "18:55:35", "remaining_time": "1:01:41"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7858, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "18:57:16", "remaining_time": "0:59:59"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7858, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "18:57:18", "remaining_time": "1:00:00"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7858, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "19:01:09", "remaining_time": "1:00:12"} +{"current_steps": 6710, "total_steps": 7064, "loss": 0.7858, "reward": null, "learning_rate": 3.109301158988609e-07, "epoch": 1.9, "percentage": 94.99, "elapsed_time": "18:57:17", "remaining_time": "1:00:00"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "19:02:50", "remaining_time": "0:58:30"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "18:58:57", "remaining_time": "0:58:18"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "18:58:58", "remaining_time": "0:58:18"} +{"current_steps": 6720, "total_steps": 7064, "loss": 0.7827, "reward": null, "learning_rate": 2.936935441506028e-07, "epoch": 1.9, "percentage": 95.13, "elapsed_time": "18:58:59", "remaining_time": "0:58:18"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "19:00:41", "remaining_time": "0:56:36"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "19:04:33", "remaining_time": "0:56:48"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "19:00:39", "remaining_time": "0:56:36"} +{"current_steps": 6730, "total_steps": 7064, "loss": 0.7784, "reward": null, "learning_rate": 2.769456309192037e-07, "epoch": 1.91, "percentage": 95.27, "elapsed_time": "19:00:40", "remaining_time": "0:56:36"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "19:02:27", "remaining_time": "0:54:55"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "19:06:18", "remaining_time": "0:55:06"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "19:02:25", "remaining_time": "0:54:55"} +{"current_steps": 6740, "total_steps": 7064, "loss": 0.7761, "reward": null, "learning_rate": 2.6068670745654224e-07, "epoch": 1.91, "percentage": 95.41, "elapsed_time": "19:02:26", "remaining_time": "0:54:55"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "19:08:01", "remaining_time": "0:53:24"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "19:04:08", "remaining_time": "0:53:13"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "19:04:08", "remaining_time": "0:53:13"} +{"current_steps": 6750, "total_steps": 7064, "loss": 0.7732, "reward": null, "learning_rate": 2.449170953429225e-07, "epoch": 1.91, "percentage": 95.55, "elapsed_time": "19:04:10", "remaining_time": "0:53:13"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "19:05:51", "remaining_time": "0:51:31"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "19:09:43", "remaining_time": "0:51:42"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "19:05:50", "remaining_time": "0:51:31"} +{"current_steps": 6760, "total_steps": 7064, "loss": 0.7899, "reward": null, "learning_rate": 2.296371064806957e-07, "epoch": 1.91, "percentage": 95.7, "elapsed_time": "19:05:49", "remaining_time": "0:51:31"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "19:11:23", "remaining_time": "0:50:00"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "19:07:30", "remaining_time": "0:49:49"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "19:07:32", "remaining_time": "0:49:50"} +{"current_steps": 6770, "total_steps": 7064, "loss": 0.7839, "reward": null, "learning_rate": 2.1484704308812053e-07, "epoch": 1.92, "percentage": 95.84, "elapsed_time": "19:07:31", "remaining_time": "0:49:49"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "19:09:14", "remaining_time": "0:48:08"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "19:13:05", "remaining_time": "0:48:18"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "19:09:12", "remaining_time": "0:48:08"} +{"current_steps": 6780, "total_steps": 7064, "loss": 0.7831, "reward": null, "learning_rate": 2.0054719769335428e-07, "epoch": 1.92, "percentage": 95.98, "elapsed_time": "19:09:12", "remaining_time": "0:48:08"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7817, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "19:10:57", "remaining_time": "0:46:26"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7817, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "19:14:48", "remaining_time": "0:46:36"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7817, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "19:10:56", "remaining_time": "0:46:26"} +{"current_steps": 6790, "total_steps": 7064, "loss": 0.7817, "reward": null, "learning_rate": 1.8673785312869063e-07, "epoch": 1.92, "percentage": 96.12, "elapsed_time": "19:10:55", "remaining_time": "0:46:26"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "19:16:34", "remaining_time": "0:44:54"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "19:12:43", "remaining_time": "0:44:45"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "19:12:41", "remaining_time": "0:44:45"} +{"current_steps": 6800, "total_steps": 7064, "loss": 0.792, "reward": null, "learning_rate": 1.7341928252495033e-07, "epoch": 1.93, "percentage": 96.26, "elapsed_time": "19:12:41", "remaining_time": "0:44:45"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "19:14:23", "remaining_time": "0:43:03"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "19:18:15", "remaining_time": "0:43:12"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "19:14:21", "remaining_time": "0:43:03"} +{"current_steps": 6810, "total_steps": 7064, "loss": 0.7942, "reward": null, "learning_rate": 1.60591749306091e-07, "epoch": 1.93, "percentage": 96.4, "elapsed_time": "19:14:22", "remaining_time": "0:43:03"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "19:16:04", "remaining_time": "0:41:21"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "19:16:02", "remaining_time": "0:41:21"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "19:16:03", "remaining_time": "0:41:21"} +{"current_steps": 6820, "total_steps": 7064, "loss": 0.7607, "reward": null, "learning_rate": 1.4825550718398362e-07, "epoch": 1.93, "percentage": 96.55, "elapsed_time": "19:19:56", "remaining_time": "0:41:29"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "19:17:46", "remaining_time": "0:39:39"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "19:21:38", "remaining_time": "0:39:47"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "19:17:45", "remaining_time": "0:39:39"} +{"current_steps": 6830, "total_steps": 7064, "loss": 0.7743, "reward": null, "learning_rate": 1.3641080015341369e-07, "epoch": 1.93, "percentage": 96.69, "elapsed_time": "19:17:44", "remaining_time": "0:39:39"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.763, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "19:19:28", "remaining_time": "0:37:58"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.763, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "19:23:20", "remaining_time": "0:38:05"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.763, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "19:19:27", "remaining_time": "0:37:58"} +{"current_steps": 6840, "total_steps": 7064, "loss": 0.763, "reward": null, "learning_rate": 1.2505786248723229e-07, "epoch": 1.94, "percentage": 96.83, "elapsed_time": "19:19:26", "remaining_time": "0:37:58"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7685, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "19:21:11", "remaining_time": "0:36:16"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7685, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "19:25:02", "remaining_time": "0:36:23"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7685, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "19:21:09", "remaining_time": "0:36:16"} +{"current_steps": 6850, "total_steps": 7064, "loss": 0.7685, "reward": null, "learning_rate": 1.1419691873174043e-07, "epoch": 1.94, "percentage": 96.97, "elapsed_time": "19:21:10", "remaining_time": "0:36:16"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "19:22:51", "remaining_time": "0:34:34"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "19:26:42", "remaining_time": "0:34:41"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "19:22:50", "remaining_time": "0:34:34"} +{"current_steps": 6860, "total_steps": 7064, "loss": 0.7773, "reward": null, "learning_rate": 1.038281837022398e-07, "epoch": 1.94, "percentage": 97.11, "elapsed_time": "19:22:49", "remaining_time": "0:34:34"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7663, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "19:24:34", "remaining_time": "0:32:53"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7663, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "19:24:32", "remaining_time": "0:32:53"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7663, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "19:24:32", "remaining_time": "0:32:53"} +{"current_steps": 6870, "total_steps": 7064, "loss": 0.7663, "reward": null, "learning_rate": 9.395186247878329e-08, "epoch": 1.95, "percentage": 97.25, "elapsed_time": "19:28:25", "remaining_time": "0:32:59"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "19:26:18", "remaining_time": "0:31:11"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "19:30:09", "remaining_time": "0:31:17"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "19:26:17", "remaining_time": "0:31:11"} +{"current_steps": 6880, "total_steps": 7064, "loss": 0.7769, "reward": null, "learning_rate": 8.456815040212562e-08, "epoch": 1.95, "percentage": 97.4, "elapsed_time": "19:26:16", "remaining_time": "0:31:11"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "19:27:59", "remaining_time": "0:29:29"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "19:27:58", "remaining_time": "0:29:29"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "19:27:57", "remaining_time": "0:29:29"} +{"current_steps": 6890, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 7.567723306984853e-08, "epoch": 1.95, "percentage": 97.54, "elapsed_time": "19:31:50", "remaining_time": "0:29:35"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7877, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "19:29:42", "remaining_time": "0:27:48"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7877, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "19:29:40", "remaining_time": "0:27:48"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7877, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "19:29:41", "remaining_time": "0:27:48"} +{"current_steps": 6900, "total_steps": 7064, "loss": 0.7877, "reward": null, "learning_rate": 6.727928633270264e-08, "epoch": 1.95, "percentage": 97.68, "elapsed_time": "19:33:33", "remaining_time": "0:27:53"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "19:31:26", "remaining_time": "0:26:06"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "19:35:17", "remaining_time": "0:26:11"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "19:31:25", "remaining_time": "0:26:06"} +{"current_steps": 6910, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 5.937447629112414e-08, "epoch": 1.96, "percentage": 97.82, "elapsed_time": "19:31:24", "remaining_time": "0:26:06"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "19:33:11", "remaining_time": "0:24:24"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "19:37:02", "remaining_time": "0:24:29"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "19:33:09", "remaining_time": "0:24:24"} +{"current_steps": 6920, "total_steps": 7064, "loss": 0.7921, "reward": null, "learning_rate": 5.196295929193739e-08, "epoch": 1.96, "percentage": 97.96, "elapsed_time": "19:33:10", "remaining_time": "0:24:24"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "19:38:44", "remaining_time": "0:22:47"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "19:34:53", "remaining_time": "0:22:43"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "19:34:51", "remaining_time": "0:22:43"} +{"current_steps": 6930, "total_steps": 7064, "loss": 0.7707, "reward": null, "learning_rate": 4.5044881925287994e-08, "epoch": 1.96, "percentage": 98.1, "elapsed_time": "19:34:52", "remaining_time": "0:22:43"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "19:36:35", "remaining_time": "0:21:01"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "19:40:26", "remaining_time": "0:21:05"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "19:36:34", "remaining_time": "0:21:01"} +{"current_steps": 6940, "total_steps": 7064, "loss": 0.7752, "reward": null, "learning_rate": 3.862038102172283e-08, "epoch": 1.96, "percentage": 98.24, "elapsed_time": "19:36:33", "remaining_time": "0:21:01"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7728, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "19:38:18", "remaining_time": "0:19:19"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7728, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "19:42:09", "remaining_time": "0:19:23"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7728, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "19:38:17", "remaining_time": "0:19:19"} +{"current_steps": 6950, "total_steps": 7064, "loss": 0.7728, "reward": null, "learning_rate": 3.268958364948671e-08, "epoch": 1.97, "percentage": 98.39, "elapsed_time": "19:38:16", "remaining_time": "0:19:19"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "19:39:59", "remaining_time": "0:17:37"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "19:40:01", "remaining_time": "0:17:37"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "19:39:59", "remaining_time": "0:17:37"} +{"current_steps": 6960, "total_steps": 7064, "loss": 0.7651, "reward": null, "learning_rate": 2.7252607112018823e-08, "epoch": 1.97, "percentage": 98.53, "elapsed_time": "19:43:52", "remaining_time": "0:17:41"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "19:41:37", "remaining_time": "0:15:56"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "19:45:30", "remaining_time": "0:15:59"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "19:41:37", "remaining_time": "0:15:56"} +{"current_steps": 6970, "total_steps": 7064, "loss": 0.7892, "reward": null, "learning_rate": 2.2309558945621257e-08, "epoch": 1.97, "percentage": 98.67, "elapsed_time": "19:41:39", "remaining_time": "0:15:56"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.7671, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "19:47:17", "remaining_time": "0:14:17"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.7671, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "19:43:25", "remaining_time": "0:14:14"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.7671, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "19:43:24", "remaining_time": "0:14:14"} +{"current_steps": 6980, "total_steps": 7064, "loss": 0.7671, "reward": null, "learning_rate": 1.7860536917341243e-08, "epoch": 1.98, "percentage": 98.81, "elapsed_time": "19:43:23", "remaining_time": "0:14:14"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "19:45:09", "remaining_time": "0:12:32"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "19:49:00", "remaining_time": "0:12:35"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "19:45:08", "remaining_time": "0:12:32"} +{"current_steps": 6990, "total_steps": 7064, "loss": 0.7767, "reward": null, "learning_rate": 1.3905629023031052e-08, "epoch": 1.98, "percentage": 98.95, "elapsed_time": "19:45:07", "remaining_time": "0:12:32"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "19:46:56", "remaining_time": "0:10:51"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "19:50:48", "remaining_time": "0:10:53"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "19:46:55", "remaining_time": "0:10:51"} +{"current_steps": 7000, "total_steps": 7064, "loss": 0.7847, "reward": null, "learning_rate": 1.0444913485610498e-08, "epoch": 1.98, "percentage": 99.09, "elapsed_time": "19:46:54", "remaining_time": "0:10:51"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7814, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "19:52:30", "remaining_time": "0:09:11"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7814, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "19:48:37", "remaining_time": "0:09:09"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7814, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "19:48:38", "remaining_time": "0:09:09"} +{"current_steps": 7010, "total_steps": 7064, "loss": 0.7814, "reward": null, "learning_rate": 7.478458753518159e-09, "epoch": 1.98, "percentage": 99.24, "elapsed_time": "19:48:39", "remaining_time": "0:09:09"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "19:54:13", "remaining_time": "0:07:29"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "19:50:20", "remaining_time": "0:07:27"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "19:50:22", "remaining_time": "0:07:27"} +{"current_steps": 7020, "total_steps": 7064, "loss": 0.7902, "reward": null, "learning_rate": 5.006323499359699e-09, "epoch": 1.99, "percentage": 99.38, "elapsed_time": "19:50:21", "remaining_time": "0:07:27"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7684, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "19:55:55", "remaining_time": "0:05:47"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7684, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "19:52:03", "remaining_time": "0:05:45"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7684, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "19:52:02", "remaining_time": "0:05:45"} +{"current_steps": 7030, "total_steps": 7064, "loss": 0.7684, "reward": null, "learning_rate": 3.02855661874768e-09, "epoch": 1.99, "percentage": 99.52, "elapsed_time": "19:52:04", "remaining_time": "0:05:45"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "19:53:46", "remaining_time": "0:04:04"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "19:57:37", "remaining_time": "0:04:04"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "19:53:45", "remaining_time": "0:04:04"} +{"current_steps": 7040, "total_steps": 7064, "loss": 0.7709, "reward": null, "learning_rate": 1.5451972293301087e-09, "epoch": 1.99, "percentage": 99.66, "elapsed_time": "19:53:44", "remaining_time": "0:04:04"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:59:17", "remaining_time": "0:02:22"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:55:25", "remaining_time": "0:02:22"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:55:24", "remaining_time": "0:02:22"} +{"current_steps": 7050, "total_steps": 7064, "loss": 0.7924, "reward": null, "learning_rate": 5.56274670021617e-10, "epoch": 2.0, "percentage": 99.8, "elapsed_time": "19:55:26", "remaining_time": "0:02:22"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "19:57:08", "remaining_time": "0:00:40"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "20:01:00", "remaining_time": "0:00:40"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "19:57:07", "remaining_time": "0:00:40"} +{"current_steps": 7060, "total_steps": 7064, "loss": 0.8148, "reward": null, "learning_rate": 6.180850041781483e-11, "epoch": 2.0, "percentage": 99.94, "elapsed_time": "19:57:06", "remaining_time": "0:00:40"} diff --git a/sft-qlora/trainer_state.json b/sft-qlora/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d2f04c4a67f3d08b8d414d3fd3ade75e5d866578 --- /dev/null +++ b/sft-qlora/trainer_state.json @@ -0,0 +1,4261 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 2.0, + "global_step": 7064, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 4.9999752766303955e-05, + "loss": 1.3185, + "step": 10 + }, + { + "epoch": 0.01, + "learning_rate": 4.999901107010577e-05, + "loss": 1.2795, + "step": 20 + }, + { + "epoch": 0.01, + "learning_rate": 4.999777492607524e-05, + "loss": 1.2266, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 4.9996044358661676e-05, + "loss": 1.19, + "step": 40 + }, + { + "epoch": 0.01, + "learning_rate": 4.9993819402093446e-05, + "loss": 1.1643, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 4.999110010037728e-05, + "loss": 1.1381, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 4.998788650729743e-05, + "loss": 1.1113, + "step": 70 + }, + { + "epoch": 0.02, + "learning_rate": 4.998417868641457e-05, + "loss": 1.0892, + "step": 80 + }, + { + "epoch": 0.03, + "learning_rate": 4.9979976711064556e-05, + "loss": 1.0801, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 4.9975280664357e-05, + "loss": 1.0822, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 4.997009063917356e-05, + "loss": 1.0794, + "step": 110 + }, + { + "epoch": 0.03, + "learning_rate": 4.996440673816617e-05, + "loss": 1.0419, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 4.995822907375498e-05, + "loss": 1.049, + "step": 130 + }, + { + "epoch": 0.04, + "learning_rate": 4.9951557768126136e-05, + "loss": 1.0202, + "step": 140 + }, + { + "epoch": 0.04, + "learning_rate": 4.9944392953229365e-05, + "loss": 1.0226, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 4.993673477077535e-05, + "loss": 0.9927, + "step": 160 + }, + { + "epoch": 0.05, + "learning_rate": 4.9928583372232954e-05, + "loss": 1.0006, + "step": 170 + }, + { + "epoch": 0.05, + "learning_rate": 4.991993891882622e-05, + "loss": 0.9999, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 4.991080158153115e-05, + "loss": 1.0003, + "step": 190 + }, + { + "epoch": 0.06, + "learning_rate": 4.990117154107236e-05, + "loss": 0.9875, + "step": 200 + }, + { + "epoch": 0.06, + "learning_rate": 4.989104898791949e-05, + "loss": 1.004, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 4.988043412228343e-05, + "loss": 0.9835, + "step": 220 + }, + { + "epoch": 0.07, + "learning_rate": 4.986932715411239e-05, + "loss": 0.9765, + "step": 230 + }, + { + "epoch": 0.07, + "learning_rate": 4.985772830308771e-05, + "loss": 0.9755, + "step": 240 + }, + { + "epoch": 0.07, + "learning_rate": 4.9845637798619536e-05, + "loss": 0.9798, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 4.983305587984227e-05, + "loss": 0.9779, + "step": 260 + }, + { + "epoch": 0.08, + "learning_rate": 4.981998279560986e-05, + "loss": 0.9707, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 4.980641880449086e-05, + "loss": 0.987, + "step": 280 + }, + { + "epoch": 0.08, + "learning_rate": 4.9792364174763323e-05, + "loss": 0.9493, + "step": 290 + }, + { + "epoch": 0.08, + "learning_rate": 4.977781918440949e-05, + "loss": 0.9701, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 4.97627841211103e-05, + "loss": 0.9476, + "step": 310 + }, + { + "epoch": 0.09, + "learning_rate": 4.97472592822397e-05, + "loss": 0.9218, + "step": 320 + }, + { + "epoch": 0.09, + "learning_rate": 4.9731244974858746e-05, + "loss": 0.9481, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 4.971474151570955e-05, + "loss": 0.9508, + "step": 340 + }, + { + "epoch": 0.1, + "learning_rate": 4.9697749231209025e-05, + "loss": 0.9587, + "step": 350 + }, + { + "epoch": 0.1, + "learning_rate": 4.968026845744237e-05, + "loss": 0.9371, + "step": 360 + }, + { + "epoch": 0.1, + "learning_rate": 4.96622995401565e-05, + "loss": 0.9242, + "step": 370 + }, + { + "epoch": 0.11, + "learning_rate": 4.9643842834753174e-05, + "loss": 0.9229, + "step": 380 + }, + { + "epoch": 0.11, + "learning_rate": 4.962489870628193e-05, + "loss": 0.9271, + "step": 390 + }, + { + "epoch": 0.11, + "learning_rate": 4.960546752943294e-05, + "loss": 0.9309, + "step": 400 + }, + { + "epoch": 0.12, + "learning_rate": 4.958554968852952e-05, + "loss": 0.9102, + "step": 410 + }, + { + "epoch": 0.12, + "learning_rate": 4.95651455775206e-05, + "loss": 0.9089, + "step": 420 + }, + { + "epoch": 0.12, + "learning_rate": 4.954425559997287e-05, + "loss": 0.9236, + "step": 430 + }, + { + "epoch": 0.12, + "learning_rate": 4.952288016906284e-05, + "loss": 0.9184, + "step": 440 + }, + { + "epoch": 0.13, + "learning_rate": 4.9501019707568665e-05, + "loss": 0.9112, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 4.947867464786174e-05, + "loss": 0.9178, + "step": 460 + }, + { + "epoch": 0.13, + "learning_rate": 4.945584543189823e-05, + "loss": 0.9364, + "step": 470 + }, + { + "epoch": 0.14, + "learning_rate": 4.943253251121022e-05, + "loss": 0.9262, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 4.9408736346896894e-05, + "loss": 0.9037, + "step": 490 + }, + { + "epoch": 0.14, + "learning_rate": 4.938445740961534e-05, + "loss": 0.928, + "step": 500 + }, + { + "epoch": 0.14, + "learning_rate": 4.935969617957126e-05, + "loss": 0.9064, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 4.93344531465095e-05, + "loss": 0.9107, + "step": 520 + }, + { + "epoch": 0.15, + "learning_rate": 4.930872880970432e-05, + "loss": 0.905, + "step": 530 + }, + { + "epoch": 0.15, + "learning_rate": 4.9282523677949556e-05, + "loss": 0.9234, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 4.9255838269548524e-05, + "loss": 0.906, + "step": 550 + }, + { + "epoch": 0.16, + "learning_rate": 4.9228673112303814e-05, + "loss": 0.8885, + "step": 560 + }, + { + "epoch": 0.16, + "learning_rate": 4.9201028743506794e-05, + "loss": 0.9103, + "step": 570 + }, + { + "epoch": 0.16, + "learning_rate": 4.917290570992702e-05, + "loss": 0.895, + "step": 580 + }, + { + "epoch": 0.17, + "learning_rate": 4.9144304567801415e-05, + "loss": 0.8948, + "step": 590 + }, + { + "epoch": 0.17, + "learning_rate": 4.911522588282327e-05, + "loss": 0.9109, + "step": 600 + }, + { + "epoch": 0.17, + "learning_rate": 4.908567023013104e-05, + "loss": 0.8914, + "step": 610 + }, + { + "epoch": 0.18, + "learning_rate": 4.9055638194296994e-05, + "loss": 0.892, + "step": 620 + }, + { + "epoch": 0.18, + "learning_rate": 4.902513036931562e-05, + "loss": 0.9049, + "step": 630 + }, + { + "epoch": 0.18, + "learning_rate": 4.89941473585919e-05, + "loss": 0.904, + "step": 640 + }, + { + "epoch": 0.18, + "learning_rate": 4.89626897749294e-05, + "loss": 0.8983, + "step": 650 + }, + { + "epoch": 0.19, + "learning_rate": 4.893075824051807e-05, + "loss": 0.8884, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 4.889835338692201e-05, + "loss": 0.8886, + "step": 670 + }, + { + "epoch": 0.19, + "learning_rate": 4.886547585506698e-05, + "loss": 0.8998, + "step": 680 + }, + { + "epoch": 0.2, + "learning_rate": 4.8832126295227656e-05, + "loss": 0.8753, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.879830536701485e-05, + "loss": 0.8937, + "step": 700 + }, + { + "epoch": 0.2, + "learning_rate": 4.876401373936239e-05, + "loss": 0.8921, + "step": 710 + }, + { + "epoch": 0.2, + "learning_rate": 4.8729252090513964e-05, + "loss": 0.8801, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.869402110800963e-05, + "loss": 0.8887, + "step": 730 + }, + { + "epoch": 0.21, + "learning_rate": 4.865832148867228e-05, + "loss": 0.8793, + "step": 740 + }, + { + "epoch": 0.21, + "learning_rate": 4.8622153938593816e-05, + "loss": 0.8811, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.8585519173121205e-05, + "loss": 0.8924, + "step": 760 + }, + { + "epoch": 0.22, + "learning_rate": 4.8548417916842324e-05, + "loss": 0.8988, + "step": 770 + }, + { + "epoch": 0.22, + "learning_rate": 4.851085090357163e-05, + "loss": 0.8907, + "step": 780 + }, + { + "epoch": 0.22, + "learning_rate": 4.847281887633565e-05, + "loss": 0.8879, + "step": 790 + }, + { + "epoch": 0.23, + "learning_rate": 4.843432258735827e-05, + "loss": 0.8796, + "step": 800 + }, + { + "epoch": 0.23, + "learning_rate": 4.839536279804589e-05, + "loss": 0.8965, + "step": 810 + }, + { + "epoch": 0.23, + "learning_rate": 4.835594027897231e-05, + "loss": 0.8678, + "step": 820 + }, + { + "epoch": 0.23, + "learning_rate": 4.831605580986355e-05, + "loss": 0.8857, + "step": 830 + }, + { + "epoch": 0.24, + "learning_rate": 4.8275710179582366e-05, + "loss": 0.8805, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.823490418611273e-05, + "loss": 0.865, + "step": 850 + }, + { + "epoch": 0.24, + "learning_rate": 4.819363863654395e-05, + "loss": 0.8892, + "step": 860 + }, + { + "epoch": 0.25, + "learning_rate": 4.8151914347054776e-05, + "loss": 0.8589, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 4.810973214289724e-05, + "loss": 0.8819, + "step": 880 + }, + { + "epoch": 0.25, + "learning_rate": 4.806709285838031e-05, + "loss": 0.8778, + "step": 890 + }, + { + "epoch": 0.25, + "learning_rate": 4.8023997336853434e-05, + "loss": 0.8725, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 4.7980446430689804e-05, + "loss": 0.8856, + "step": 910 + }, + { + "epoch": 0.26, + "learning_rate": 4.793644100126954e-05, + "loss": 0.8836, + "step": 920 + }, + { + "epoch": 0.26, + "learning_rate": 4.7891981918962656e-05, + "loss": 0.8684, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 4.784707006311179e-05, + "loss": 0.8671, + "step": 940 + }, + { + "epoch": 0.27, + "learning_rate": 4.780170632201487e-05, + "loss": 0.868, + "step": 950 + }, + { + "epoch": 0.27, + "learning_rate": 4.7755891592907556e-05, + "loss": 0.8683, + "step": 960 + }, + { + "epoch": 0.27, + "learning_rate": 4.7709626781945397e-05, + "loss": 0.8581, + "step": 970 + }, + { + "epoch": 0.28, + "learning_rate": 4.766291280418603e-05, + "loss": 0.8653, + "step": 980 + }, + { + "epoch": 0.28, + "learning_rate": 4.761575058357101e-05, + "loss": 0.8677, + "step": 990 + }, + { + "epoch": 0.28, + "learning_rate": 4.756814105290753e-05, + "loss": 0.8734, + "step": 1000 + }, + { + "epoch": 0.29, + "learning_rate": 4.7520085153850014e-05, + "loss": 0.8583, + "step": 1010 + }, + { + "epoch": 0.29, + "learning_rate": 4.7471583836881476e-05, + "loss": 0.874, + "step": 1020 + }, + { + "epoch": 0.29, + "learning_rate": 4.742263806129469e-05, + "loss": 0.8554, + "step": 1030 + }, + { + "epoch": 0.29, + "learning_rate": 4.737324879517326e-05, + "loss": 0.8807, + "step": 1040 + }, + { + "epoch": 0.3, + "learning_rate": 4.732341701537245e-05, + "loss": 0.8633, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 4.727314370749988e-05, + "loss": 0.875, + "step": 1060 + }, + { + "epoch": 0.3, + "learning_rate": 4.7222429865896e-05, + "loss": 0.8709, + "step": 1070 + }, + { + "epoch": 0.31, + "learning_rate": 4.717127649361444e-05, + "loss": 0.8634, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 4.71196846024022e-05, + "loss": 0.8566, + "step": 1090 + }, + { + "epoch": 0.31, + "learning_rate": 4.7067655212679585e-05, + "loss": 0.8667, + "step": 1100 + }, + { + "epoch": 0.31, + "learning_rate": 4.701518935352006e-05, + "loss": 0.8688, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 4.69622880626299e-05, + "loss": 0.8573, + "step": 1120 + }, + { + "epoch": 0.32, + "learning_rate": 4.690895238632762e-05, + "loss": 0.8576, + "step": 1130 + }, + { + "epoch": 0.32, + "learning_rate": 4.685518337952335e-05, + "loss": 0.8525, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 4.680098210569789e-05, + "loss": 0.8656, + "step": 1150 + }, + { + "epoch": 0.33, + "learning_rate": 4.674634963688177e-05, + "loss": 0.8703, + "step": 1160 + }, + { + "epoch": 0.33, + "learning_rate": 4.669128705363394e-05, + "loss": 0.8616, + "step": 1170 + }, + { + "epoch": 0.33, + "learning_rate": 4.663579544502049e-05, + "loss": 0.8677, + "step": 1180 + }, + { + "epoch": 0.34, + "learning_rate": 4.657987590859305e-05, + "loss": 0.8525, + "step": 1190 + }, + { + "epoch": 0.34, + "learning_rate": 4.652352955036713e-05, + "loss": 0.8526, + "step": 1200 + }, + { + "epoch": 0.34, + "learning_rate": 4.646675748480019e-05, + "loss": 0.8586, + "step": 1210 + }, + { + "epoch": 0.35, + "learning_rate": 4.640956083476964e-05, + "loss": 0.8542, + "step": 1220 + }, + { + "epoch": 0.35, + "learning_rate": 4.635194073155061e-05, + "loss": 0.8517, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 4.62938983147936e-05, + "loss": 0.8592, + "step": 1240 + }, + { + "epoch": 0.35, + "learning_rate": 4.62354347325019e-05, + "loss": 0.8678, + "step": 1250 + }, + { + "epoch": 0.36, + "learning_rate": 4.6176551141008916e-05, + "loss": 0.8644, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 4.611724870495528e-05, + "loss": 0.8541, + "step": 1270 + }, + { + "epoch": 0.36, + "learning_rate": 4.605752859726583e-05, + "loss": 0.8438, + "step": 1280 + }, + { + "epoch": 0.37, + "learning_rate": 4.5997391999126397e-05, + "loss": 0.8604, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 4.5936840099960465e-05, + "loss": 0.8633, + "step": 1300 + }, + { + "epoch": 0.37, + "learning_rate": 4.587587409740561e-05, + "loss": 0.8437, + "step": 1310 + }, + { + "epoch": 0.37, + "learning_rate": 4.581449519728986e-05, + "loss": 0.8466, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 4.575270461360779e-05, + "loss": 0.8457, + "step": 1330 + }, + { + "epoch": 0.38, + "learning_rate": 4.569050356849655e-05, + "loss": 0.8477, + "step": 1340 + }, + { + "epoch": 0.38, + "learning_rate": 4.562789329221169e-05, + "loss": 0.8608, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 4.5564875023102796e-05, + "loss": 0.8555, + "step": 1360 + }, + { + "epoch": 0.39, + "learning_rate": 4.550145000758905e-05, + "loss": 0.8624, + "step": 1370 + }, + { + "epoch": 0.39, + "learning_rate": 4.543761950013453e-05, + "loss": 0.8613, + "step": 1380 + }, + { + "epoch": 0.39, + "learning_rate": 4.537338476322341e-05, + "loss": 0.849, + "step": 1390 + }, + { + "epoch": 0.4, + "learning_rate": 4.530874706733502e-05, + "loss": 0.858, + "step": 1400 + }, + { + "epoch": 0.4, + "learning_rate": 4.524370769091866e-05, + "loss": 0.8468, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 4.5178267920368366e-05, + "loss": 0.8624, + "step": 1420 + }, + { + "epoch": 0.4, + "learning_rate": 4.511242904999746e-05, + "loss": 0.8464, + "step": 1430 + }, + { + "epoch": 0.41, + "learning_rate": 4.50461923820129e-05, + "loss": 0.8575, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 4.497955922648961e-05, + "loss": 0.8587, + "step": 1450 + }, + { + "epoch": 0.41, + "learning_rate": 4.491253090134447e-05, + "loss": 0.8517, + "step": 1460 + }, + { + "epoch": 0.42, + "learning_rate": 4.4845108732310355e-05, + "loss": 0.8427, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 4.4777294052909804e-05, + "loss": 0.8588, + "step": 1480 + }, + { + "epoch": 0.42, + "learning_rate": 4.470908820442873e-05, + "loss": 0.8516, + "step": 1490 + }, + { + "epoch": 0.42, + "learning_rate": 4.464049253588985e-05, + "loss": 0.8408, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 4.457150840402604e-05, + "loss": 0.8513, + "step": 1510 + }, + { + "epoch": 0.43, + "learning_rate": 4.450213717325343e-05, + "loss": 0.8554, + "step": 1520 + }, + { + "epoch": 0.43, + "learning_rate": 4.443238021564448e-05, + "loss": 0.8598, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 4.4362238910900835e-05, + "loss": 0.8495, + "step": 1540 + }, + { + "epoch": 0.44, + "learning_rate": 4.4291714646326024e-05, + "loss": 0.8338, + "step": 1550 + }, + { + "epoch": 0.44, + "learning_rate": 4.4220808816797995e-05, + "loss": 0.8576, + "step": 1560 + }, + { + "epoch": 0.44, + "learning_rate": 4.414952282474158e-05, + "loss": 0.8593, + "step": 1570 + }, + { + "epoch": 0.45, + "learning_rate": 4.407785808010073e-05, + "loss": 0.8534, + "step": 1580 + }, + { + "epoch": 0.45, + "learning_rate": 4.400581600031062e-05, + "loss": 0.8564, + "step": 1590 + }, + { + "epoch": 0.45, + "learning_rate": 4.3933398010269614e-05, + "loss": 0.8446, + "step": 1600 + }, + { + "epoch": 0.46, + "learning_rate": 4.386060554231111e-05, + "loss": 0.8445, + "step": 1610 + }, + { + "epoch": 0.46, + "learning_rate": 4.378744003617517e-05, + "loss": 0.8281, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 4.371390293898007e-05, + "loss": 0.8449, + "step": 1630 + }, + { + "epoch": 0.46, + "learning_rate": 4.3639995705193684e-05, + "loss": 0.8405, + "step": 1640 + }, + { + "epoch": 0.47, + "learning_rate": 4.3565719796604706e-05, + "loss": 0.8349, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 4.3491076682293715e-05, + "loss": 0.8311, + "step": 1660 + }, + { + "epoch": 0.47, + "learning_rate": 4.341606783860416e-05, + "loss": 0.8383, + "step": 1670 + }, + { + "epoch": 0.48, + "learning_rate": 4.334069474911313e-05, + "loss": 0.8313, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 4.326495890460204e-05, + "loss": 0.8424, + "step": 1690 + }, + { + "epoch": 0.48, + "learning_rate": 4.3188861803027094e-05, + "loss": 0.8323, + "step": 1700 + }, + { + "epoch": 0.48, + "learning_rate": 4.3112404949489715e-05, + "loss": 0.8501, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 4.303558985620673e-05, + "loss": 0.8399, + "step": 1720 + }, + { + "epoch": 0.49, + "learning_rate": 4.2958418042480506e-05, + "loss": 0.8184, + "step": 1730 + }, + { + "epoch": 0.49, + "learning_rate": 4.288089103466886e-05, + "loss": 0.8418, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 4.280301036615489e-05, + "loss": 0.828, + "step": 1750 + }, + { + "epoch": 0.5, + "learning_rate": 4.272477757731662e-05, + "loss": 0.836, + "step": 1760 + }, + { + "epoch": 0.5, + "learning_rate": 4.2646194215496595e-05, + "loss": 0.825, + "step": 1770 + }, + { + "epoch": 0.5, + "learning_rate": 4.2567261834971206e-05, + "loss": 0.8357, + "step": 1780 + }, + { + "epoch": 0.51, + "learning_rate": 4.248798199691998e-05, + "loss": 0.8498, + "step": 1790 + }, + { + "epoch": 0.51, + "learning_rate": 4.2408356269394714e-05, + "loss": 0.8361, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 4.2328386227288445e-05, + "loss": 0.8237, + "step": 1810 + }, + { + "epoch": 0.52, + "learning_rate": 4.224807345230429e-05, + "loss": 0.8413, + "step": 1820 + }, + { + "epoch": 0.52, + "learning_rate": 4.21674195329242e-05, + "loss": 0.823, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 4.208642606437748e-05, + "loss": 0.8501, + "step": 1840 + }, + { + "epoch": 0.52, + "learning_rate": 4.2005094648609325e-05, + "loss": 0.8372, + "step": 1850 + }, + { + "epoch": 0.53, + "learning_rate": 4.192342689424903e-05, + "loss": 0.8072, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 4.184142441657827e-05, + "loss": 0.8409, + "step": 1870 + }, + { + "epoch": 0.53, + "learning_rate": 4.1759088837499095e-05, + "loss": 0.856, + "step": 1880 + }, + { + "epoch": 0.54, + "learning_rate": 4.167642178550186e-05, + "loss": 0.8428, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 4.159342489563304e-05, + "loss": 0.8344, + "step": 1900 + }, + { + "epoch": 0.54, + "learning_rate": 4.151009980946287e-05, + "loss": 0.8317, + "step": 1910 + }, + { + "epoch": 0.54, + "learning_rate": 4.142644817505284e-05, + "loss": 0.8172, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 4.1342471646923196e-05, + "loss": 0.8305, + "step": 1930 + }, + { + "epoch": 0.55, + "learning_rate": 4.1258171886020124e-05, + "loss": 0.8303, + "step": 1940 + }, + { + "epoch": 0.55, + "learning_rate": 4.117355055968295e-05, + "loss": 0.8292, + "step": 1950 + }, + { + "epoch": 0.55, + "learning_rate": 4.1088609341611135e-05, + "loss": 0.8162, + "step": 1960 + }, + { + "epoch": 0.56, + "learning_rate": 4.1003349911831166e-05, + "loss": 0.8344, + "step": 1970 + }, + { + "epoch": 0.56, + "learning_rate": 4.091777395666338e-05, + "loss": 0.8545, + "step": 1980 + }, + { + "epoch": 0.56, + "learning_rate": 4.0831883168688534e-05, + "loss": 0.8305, + "step": 1990 + }, + { + "epoch": 0.57, + "learning_rate": 4.07456792467144e-05, + "loss": 0.8365, + "step": 2000 + }, + { + "epoch": 0.57, + "learning_rate": 4.065916389574211e-05, + "loss": 0.8375, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 4.057233882693246e-05, + "loss": 0.8351, + "step": 2020 + }, + { + "epoch": 0.57, + "learning_rate": 4.048520575757207e-05, + "loss": 0.8165, + "step": 2030 + }, + { + "epoch": 0.58, + "learning_rate": 4.0397766411039395e-05, + "loss": 0.8194, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 4.031002251677067e-05, + "loss": 0.8218, + "step": 2050 + }, + { + "epoch": 0.58, + "learning_rate": 4.022197581022567e-05, + "loss": 0.8203, + "step": 2060 + }, + { + "epoch": 0.59, + "learning_rate": 4.0133628032853435e-05, + "loss": 0.832, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 4.004498093205773e-05, + "loss": 0.8066, + "step": 2080 + }, + { + "epoch": 0.59, + "learning_rate": 3.99560362611626e-05, + "loss": 0.8421, + "step": 2090 + }, + { + "epoch": 0.59, + "learning_rate": 3.986679577937762e-05, + "loss": 0.8217, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 3.9777261251763145e-05, + "loss": 0.8268, + "step": 2110 + }, + { + "epoch": 0.6, + "learning_rate": 3.9687434449195316e-05, + "loss": 0.8321, + "step": 2120 + }, + { + "epoch": 0.6, + "learning_rate": 3.959731714833115e-05, + "loss": 0.8266, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 3.95069111315733e-05, + "loss": 0.82, + "step": 2140 + }, + { + "epoch": 0.61, + "learning_rate": 3.9416218187034876e-05, + "loss": 0.8347, + "step": 2150 + }, + { + "epoch": 0.61, + "learning_rate": 3.9325240108504016e-05, + "loss": 0.8472, + "step": 2160 + }, + { + "epoch": 0.61, + "learning_rate": 3.923397869540845e-05, + "loss": 0.8092, + "step": 2170 + }, + { + "epoch": 0.62, + "learning_rate": 3.91424357527799e-05, + "loss": 0.8166, + "step": 2180 + }, + { + "epoch": 0.62, + "learning_rate": 3.905061309121837e-05, + "loss": 0.817, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 3.895851252685634e-05, + "loss": 0.8073, + "step": 2200 + }, + { + "epoch": 0.63, + "learning_rate": 3.886613588132284e-05, + "loss": 0.8355, + "step": 2210 + }, + { + "epoch": 0.63, + "learning_rate": 3.877348498170743e-05, + "loss": 0.8232, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 3.868056166052407e-05, + "loss": 0.8312, + "step": 2230 + }, + { + "epoch": 0.63, + "learning_rate": 3.858736775567484e-05, + "loss": 0.8215, + "step": 2240 + }, + { + "epoch": 0.64, + "learning_rate": 3.8493905110413626e-05, + "loss": 0.8263, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 3.8400175573309646e-05, + "loss": 0.8282, + "step": 2260 + }, + { + "epoch": 0.64, + "learning_rate": 3.83061809982109e-05, + "loss": 0.8337, + "step": 2270 + }, + { + "epoch": 0.65, + "learning_rate": 3.821192324420747e-05, + "loss": 0.8291, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 3.8117404175594795e-05, + "loss": 0.8444, + "step": 2290 + }, + { + "epoch": 0.65, + "learning_rate": 3.8022625661836775e-05, + "loss": 0.8063, + "step": 2300 + }, + { + "epoch": 0.65, + "learning_rate": 3.792758957752879e-05, + "loss": 0.825, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 3.783229780236062e-05, + "loss": 0.8244, + "step": 2320 + }, + { + "epoch": 0.66, + "learning_rate": 3.773675222107929e-05, + "loss": 0.8086, + "step": 2330 + }, + { + "epoch": 0.66, + "learning_rate": 3.7640954723451784e-05, + "loss": 0.823, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 3.7544907204227646e-05, + "loss": 0.8177, + "step": 2350 + }, + { + "epoch": 0.67, + "learning_rate": 3.7448611563101536e-05, + "loss": 0.8142, + "step": 2360 + }, + { + "epoch": 0.67, + "learning_rate": 3.735206970467564e-05, + "loss": 0.8236, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 3.7255283538421984e-05, + "loss": 0.8169, + "step": 2380 + }, + { + "epoch": 0.68, + "learning_rate": 3.7158254978644703e-05, + "loss": 0.8143, + "step": 2390 + }, + { + "epoch": 0.68, + "learning_rate": 3.706098594444216e-05, + "loss": 0.8061, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 3.6963478359668966e-05, + "loss": 0.8253, + "step": 2410 + }, + { + "epoch": 0.69, + "learning_rate": 3.6865734152897987e-05, + "loss": 0.812, + "step": 2420 + }, + { + "epoch": 0.69, + "learning_rate": 3.676775525738213e-05, + "loss": 0.8263, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 3.666954361101616e-05, + "loss": 0.8144, + "step": 2440 + }, + { + "epoch": 0.69, + "learning_rate": 3.657110115629832e-05, + "loss": 0.8089, + "step": 2450 + }, + { + "epoch": 0.7, + "learning_rate": 3.647242984029201e-05, + "loss": 0.8155, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 3.637353161458713e-05, + "loss": 0.8142, + "step": 2470 + }, + { + "epoch": 0.7, + "learning_rate": 3.627440843526158e-05, + "loss": 0.8192, + "step": 2480 + }, + { + "epoch": 0.7, + "learning_rate": 3.6175062262842585e-05, + "loss": 0.8134, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 3.607549506226784e-05, + "loss": 0.8175, + "step": 2500 + }, + { + "epoch": 0.71, + "learning_rate": 3.5975708802846725e-05, + "loss": 0.8192, + "step": 2510 + }, + { + "epoch": 0.71, + "learning_rate": 3.587570545822128e-05, + "loss": 0.8348, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 3.5775487006327215e-05, + "loss": 0.8147, + "step": 2530 + }, + { + "epoch": 0.72, + "learning_rate": 3.567505542935482e-05, + "loss": 0.8235, + "step": 2540 + }, + { + "epoch": 0.72, + "learning_rate": 3.557441271370968e-05, + "loss": 0.8175, + "step": 2550 + }, + { + "epoch": 0.72, + "learning_rate": 3.547356084997344e-05, + "loss": 0.8197, + "step": 2560 + }, + { + "epoch": 0.73, + "learning_rate": 3.537250183286443e-05, + "loss": 0.808, + "step": 2570 + }, + { + "epoch": 0.73, + "learning_rate": 3.527123766119818e-05, + "loss": 0.8154, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 3.5169770337847935e-05, + "loss": 0.8104, + "step": 2590 + }, + { + "epoch": 0.74, + "learning_rate": 3.5068101869705004e-05, + "loss": 0.8318, + "step": 2600 + }, + { + "epoch": 0.74, + "learning_rate": 3.496623426763908e-05, + "loss": 0.8146, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 3.486416954645846e-05, + "loss": 0.8097, + "step": 2620 + }, + { + "epoch": 0.74, + "learning_rate": 3.4761909724870205e-05, + "loss": 0.8176, + "step": 2630 + }, + { + "epoch": 0.75, + "learning_rate": 3.4659456825440216e-05, + "loss": 0.8284, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 3.4556812874553204e-05, + "loss": 0.8159, + "step": 2650 + }, + { + "epoch": 0.75, + "learning_rate": 3.445397990237264e-05, + "loss": 0.8204, + "step": 2660 + }, + { + "epoch": 0.76, + "learning_rate": 3.4350959942800584e-05, + "loss": 0.8013, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 3.424775503343747e-05, + "loss": 0.8196, + "step": 2680 + }, + { + "epoch": 0.76, + "learning_rate": 3.414436721554179e-05, + "loss": 0.802, + "step": 2690 + }, + { + "epoch": 0.76, + "learning_rate": 3.4040798533989745e-05, + "loss": 0.8204, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 3.3937051037234745e-05, + "loss": 0.8055, + "step": 2710 + }, + { + "epoch": 0.77, + "learning_rate": 3.3833126777266974e-05, + "loss": 0.8171, + "step": 2720 + }, + { + "epoch": 0.77, + "learning_rate": 3.3729027809572735e-05, + "loss": 0.8222, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 3.3624756193093835e-05, + "loss": 0.8104, + "step": 2740 + }, + { + "epoch": 0.78, + "learning_rate": 3.3520313990186856e-05, + "loss": 0.8147, + "step": 2750 + }, + { + "epoch": 0.78, + "learning_rate": 3.341570326658232e-05, + "loss": 0.8017, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 3.331092609134392e-05, + "loss": 0.8059, + "step": 2770 + }, + { + "epoch": 0.79, + "learning_rate": 3.32059845368275e-05, + "loss": 0.8204, + "step": 2780 + }, + { + "epoch": 0.79, + "learning_rate": 3.310088067864015e-05, + "loss": 0.812, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 3.299561659559909e-05, + "loss": 0.8087, + "step": 2800 + }, + { + "epoch": 0.8, + "learning_rate": 3.289019436969057e-05, + "loss": 0.8038, + "step": 2810 + }, + { + "epoch": 0.8, + "learning_rate": 3.278461608602873e-05, + "loss": 0.8094, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 3.267888383281431e-05, + "loss": 0.8182, + "step": 2830 + }, + { + "epoch": 0.8, + "learning_rate": 3.257299970129336e-05, + "loss": 0.812, + "step": 2840 + }, + { + "epoch": 0.81, + "learning_rate": 3.246696578571592e-05, + "loss": 0.809, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 3.236078418329452e-05, + "loss": 0.8288, + "step": 2860 + }, + { + "epoch": 0.81, + "learning_rate": 3.225445699416276e-05, + "loss": 0.808, + "step": 2870 + }, + { + "epoch": 0.82, + "learning_rate": 3.214798632133376e-05, + "loss": 0.8127, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 3.204137427065857e-05, + "loss": 0.8159, + "step": 2890 + }, + { + "epoch": 0.82, + "learning_rate": 3.193462295078448e-05, + "loss": 0.819, + "step": 2900 + }, + { + "epoch": 0.82, + "learning_rate": 3.1827734473113356e-05, + "loss": 0.8108, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 3.172071095175989e-05, + "loss": 0.8199, + "step": 2920 + }, + { + "epoch": 0.83, + "learning_rate": 3.1613554503509715e-05, + "loss": 0.7977, + "step": 2930 + }, + { + "epoch": 0.83, + "learning_rate": 3.1506267247777645e-05, + "loss": 0.8171, + "step": 2940 + }, + { + "epoch": 0.84, + "learning_rate": 3.139885130656563e-05, + "loss": 0.8064, + "step": 2950 + }, + { + "epoch": 0.84, + "learning_rate": 3.129130880442091e-05, + "loss": 0.8087, + "step": 2960 + }, + { + "epoch": 0.84, + "learning_rate": 3.118364186839389e-05, + "loss": 0.8023, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 3.107585262799613e-05, + "loss": 0.7978, + "step": 2980 + }, + { + "epoch": 0.85, + "learning_rate": 3.096794321515823e-05, + "loss": 0.8268, + "step": 2990 + }, + { + "epoch": 0.85, + "learning_rate": 3.0859915764187616e-05, + "loss": 0.8129, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 3.075177241172637e-05, + "loss": 0.8121, + "step": 3010 + }, + { + "epoch": 0.86, + "learning_rate": 3.064351529670895e-05, + "loss": 0.8018, + "step": 3020 + }, + { + "epoch": 0.86, + "learning_rate": 3.0535146560319895e-05, + "loss": 0.8191, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 3.0426668345951448e-05, + "loss": 0.813, + "step": 3040 + }, + { + "epoch": 0.86, + "learning_rate": 3.031808279916121e-05, + "loss": 0.8252, + "step": 3050 + }, + { + "epoch": 0.87, + "learning_rate": 3.0209392067629676e-05, + "loss": 0.7995, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 3.010059830111773e-05, + "loss": 0.8162, + "step": 3070 + }, + { + "epoch": 0.87, + "learning_rate": 2.9991703651424184e-05, + "loss": 0.8175, + "step": 3080 + }, + { + "epoch": 0.87, + "learning_rate": 2.988271027234317e-05, + "loss": 0.8076, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 2.977362031962158e-05, + "loss": 0.8063, + "step": 3100 + }, + { + "epoch": 0.88, + "learning_rate": 2.966443595091637e-05, + "loss": 0.8159, + "step": 3110 + }, + { + "epoch": 0.88, + "learning_rate": 2.9555159325751947e-05, + "loss": 0.8083, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 2.9445792605477433e-05, + "loss": 0.807, + "step": 3130 + }, + { + "epoch": 0.89, + "learning_rate": 2.933633795322391e-05, + "loss": 0.8123, + "step": 3140 + }, + { + "epoch": 0.89, + "learning_rate": 2.9226797533861615e-05, + "loss": 0.8107, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 2.9117173513957186e-05, + "loss": 0.8053, + "step": 3160 + }, + { + "epoch": 0.9, + "learning_rate": 2.900746806173074e-05, + "loss": 0.8068, + "step": 3170 + }, + { + "epoch": 0.9, + "learning_rate": 2.889768334701305e-05, + "loss": 0.8086, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 2.8787821541202564e-05, + "loss": 0.8042, + "step": 3190 + }, + { + "epoch": 0.91, + "learning_rate": 2.8677884817222505e-05, + "loss": 0.8019, + "step": 3200 + }, + { + "epoch": 0.91, + "learning_rate": 2.856787534947789e-05, + "loss": 0.8117, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 2.8457795313812507e-05, + "loss": 0.8243, + "step": 3220 + }, + { + "epoch": 0.91, + "learning_rate": 2.8347646887465867e-05, + "loss": 0.7953, + "step": 3230 + }, + { + "epoch": 0.92, + "learning_rate": 2.8237432249030183e-05, + "loss": 0.8042, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 2.812715357840725e-05, + "loss": 0.799, + "step": 3250 + }, + { + "epoch": 0.92, + "learning_rate": 2.801681305676534e-05, + "loss": 0.8093, + "step": 3260 + }, + { + "epoch": 0.93, + "learning_rate": 2.7906412866496034e-05, + "loss": 0.8048, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 2.7795955191171114e-05, + "loss": 0.8116, + "step": 3280 + }, + { + "epoch": 0.93, + "learning_rate": 2.7685442215499323e-05, + "loss": 0.8151, + "step": 3290 + }, + { + "epoch": 0.93, + "learning_rate": 2.7574876125283176e-05, + "loss": 0.8017, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 2.7464259107375722e-05, + "loss": 0.8051, + "step": 3310 + }, + { + "epoch": 0.94, + "learning_rate": 2.7353593349637297e-05, + "loss": 0.803, + "step": 3320 + }, + { + "epoch": 0.94, + "learning_rate": 2.7242881040892255e-05, + "loss": 0.8094, + "step": 3330 + }, + { + "epoch": 0.95, + "learning_rate": 2.713212437088564e-05, + "loss": 0.8186, + "step": 3340 + }, + { + "epoch": 0.95, + "learning_rate": 2.702132553023993e-05, + "loss": 0.8041, + "step": 3350 + }, + { + "epoch": 0.95, + "learning_rate": 2.691048671041169e-05, + "loss": 0.8009, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 2.6799610103648197e-05, + "loss": 0.7931, + "step": 3370 + }, + { + "epoch": 0.96, + "learning_rate": 2.668869790294411e-05, + "loss": 0.8001, + "step": 3380 + }, + { + "epoch": 0.96, + "learning_rate": 2.6577752301998098e-05, + "loss": 0.8167, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 2.6466775495169437e-05, + "loss": 0.8114, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 2.6355769677434628e-05, + "loss": 0.8026, + "step": 3410 + }, + { + "epoch": 0.97, + "learning_rate": 2.6244737044343954e-05, + "loss": 0.8063, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 2.6133679791978065e-05, + "loss": 0.8087, + "step": 3430 + }, + { + "epoch": 0.97, + "learning_rate": 2.602260011690457e-05, + "loss": 0.812, + "step": 3440 + }, + { + "epoch": 0.98, + "learning_rate": 2.591150021613456e-05, + "loss": 0.7899, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 2.580038228707916e-05, + "loss": 0.798, + "step": 3460 + }, + { + "epoch": 0.98, + "learning_rate": 2.568924852750607e-05, + "loss": 0.826, + "step": 3470 + }, + { + "epoch": 0.99, + "learning_rate": 2.55781011354961e-05, + "loss": 0.8111, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 2.5466942309399706e-05, + "loss": 0.7924, + "step": 3490 + }, + { + "epoch": 0.99, + "learning_rate": 2.535577424779347e-05, + "loss": 0.8001, + "step": 3500 + }, + { + "epoch": 0.99, + "learning_rate": 2.5244599149436642e-05, + "loss": 0.7906, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 2.5133419213227684e-05, + "loss": 0.804, + "step": 3520 + }, + { + "epoch": 1.0, + "learning_rate": 2.5022236638160712e-05, + "loss": 0.8123, + "step": 3530 + }, + { + "epoch": 1.0, + "learning_rate": 2.491105362328204e-05, + "loss": 0.8164, + "step": 3540 + }, + { + "epoch": 1.01, + "learning_rate": 2.4799872367646685e-05, + "loss": 0.8169, + "step": 3550 + }, + { + "epoch": 1.01, + "learning_rate": 2.468869507027486e-05, + "loss": 0.7835, + "step": 3560 + }, + { + "epoch": 1.01, + "learning_rate": 2.457752393010851e-05, + "loss": 0.8199, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.4466361145967782e-05, + "loss": 0.8096, + "step": 3580 + }, + { + "epoch": 1.02, + "learning_rate": 2.4355208916507554e-05, + "loss": 0.7792, + "step": 3590 + }, + { + "epoch": 1.02, + "learning_rate": 2.4244069440173938e-05, + "loss": 0.7789, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.413294491516083e-05, + "loss": 0.8127, + "step": 3610 + }, + { + "epoch": 1.02, + "learning_rate": 2.402183753936639e-05, + "loss": 0.816, + "step": 3620 + }, + { + "epoch": 1.03, + "learning_rate": 2.3910749510349574e-05, + "loss": 0.8045, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.3799683025286727e-05, + "loss": 0.8065, + "step": 3640 + }, + { + "epoch": 1.03, + "learning_rate": 2.3688640280928043e-05, + "loss": 0.8016, + "step": 3650 + }, + { + "epoch": 1.04, + "learning_rate": 2.357762347355418e-05, + "loss": 0.7902, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.346663479893277e-05, + "loss": 0.8044, + "step": 3670 + }, + { + "epoch": 1.04, + "learning_rate": 2.3355676452275057e-05, + "loss": 0.8136, + "step": 3680 + }, + { + "epoch": 1.04, + "learning_rate": 2.3244750628192395e-05, + "loss": 0.7885, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.313385952065291e-05, + "loss": 0.7734, + "step": 3700 + }, + { + "epoch": 1.05, + "learning_rate": 2.302300532293806e-05, + "loss": 0.8117, + "step": 3710 + }, + { + "epoch": 1.05, + "learning_rate": 2.2912190227599305e-05, + "loss": 0.7969, + "step": 3720 + }, + { + "epoch": 1.06, + "learning_rate": 2.280141642641468e-05, + "loss": 0.7741, + "step": 3730 + }, + { + "epoch": 1.06, + "learning_rate": 2.26906861103455e-05, + "loss": 0.7996, + "step": 3740 + }, + { + "epoch": 1.06, + "learning_rate": 2.2580001469492968e-05, + "loss": 0.806, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.2469364693054938e-05, + "loss": 0.7969, + "step": 3760 + }, + { + "epoch": 1.07, + "learning_rate": 2.235877796928252e-05, + "loss": 0.8017, + "step": 3770 + }, + { + "epoch": 1.07, + "learning_rate": 2.2248243485436892e-05, + "loss": 0.8066, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.213776342774595e-05, + "loss": 0.7969, + "step": 3790 + }, + { + "epoch": 1.08, + "learning_rate": 2.2027339981361156e-05, + "loss": 0.8008, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 2.1916975330314235e-05, + "loss": 0.8111, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1806671657474048e-05, + "loss": 0.7797, + "step": 3820 + }, + { + "epoch": 1.08, + "learning_rate": 2.1696431144503356e-05, + "loss": 0.8016, + "step": 3830 + }, + { + "epoch": 1.09, + "learning_rate": 2.1586255971815738e-05, + "loss": 0.7962, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.147614831853239e-05, + "loss": 0.7897, + "step": 3850 + }, + { + "epoch": 1.09, + "learning_rate": 2.136611036243908e-05, + "loss": 0.7951, + "step": 3860 + }, + { + "epoch": 1.1, + "learning_rate": 2.1256144279943066e-05, + "loss": 0.7856, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.114625224603002e-05, + "loss": 0.7823, + "step": 3880 + }, + { + "epoch": 1.1, + "learning_rate": 2.1036436434221048e-05, + "loss": 0.8101, + "step": 3890 + }, + { + "epoch": 1.1, + "learning_rate": 2.0926699016529656e-05, + "loss": 0.7789, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 2.0817042163418858e-05, + "loss": 0.7993, + "step": 3910 + }, + { + "epoch": 1.11, + "learning_rate": 2.0707468043758156e-05, + "loss": 0.8107, + "step": 3920 + }, + { + "epoch": 1.11, + "learning_rate": 2.059797882478074e-05, + "loss": 0.8005, + "step": 3930 + }, + { + "epoch": 1.12, + "learning_rate": 2.048857667204053e-05, + "loss": 0.8144, + "step": 3940 + }, + { + "epoch": 1.12, + "learning_rate": 2.0379263749369434e-05, + "loss": 0.7894, + "step": 3950 + }, + { + "epoch": 1.12, + "learning_rate": 2.027004221883447e-05, + "loss": 0.7763, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.016091424069506e-05, + "loss": 0.781, + "step": 3970 + }, + { + "epoch": 1.13, + "learning_rate": 2.0051881973360266e-05, + "loss": 0.7878, + "step": 3980 + }, + { + "epoch": 1.13, + "learning_rate": 1.9942947573346133e-05, + "loss": 0.7956, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 1.9834113195233e-05, + "loss": 0.8036, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 1.9725380991622923e-05, + "loss": 0.7945, + "step": 4010 + }, + { + "epoch": 1.14, + "learning_rate": 1.961675311309705e-05, + "loss": 0.7955, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 1.9508231708173146e-05, + "loss": 0.7772, + "step": 4030 + }, + { + "epoch": 1.14, + "learning_rate": 1.9399818923263056e-05, + "loss": 0.7805, + "step": 4040 + }, + { + "epoch": 1.15, + "learning_rate": 1.929151690263026e-05, + "loss": 0.798, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 1.918332778834745e-05, + "loss": 0.8183, + "step": 4060 + }, + { + "epoch": 1.15, + "learning_rate": 1.9075253720254217e-05, + "loss": 0.8106, + "step": 4070 + }, + { + "epoch": 1.16, + "learning_rate": 1.8967296835914643e-05, + "loss": 0.7918, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 1.885945927057511e-05, + "loss": 0.779, + "step": 4090 + }, + { + "epoch": 1.16, + "learning_rate": 1.8751743157122003e-05, + "loss": 0.7881, + "step": 4100 + }, + { + "epoch": 1.16, + "learning_rate": 1.8644150626039534e-05, + "loss": 0.7952, + "step": 4110 + }, + { + "epoch": 1.17, + "learning_rate": 1.8536683805367656e-05, + "loss": 0.7971, + "step": 4120 + }, + { + "epoch": 1.17, + "learning_rate": 1.8429344820659892e-05, + "loss": 0.8005, + "step": 4130 + }, + { + "epoch": 1.17, + "learning_rate": 1.832213579494137e-05, + "loss": 0.8014, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 1.8215058848666765e-05, + "loss": 0.7883, + "step": 4150 + }, + { + "epoch": 1.18, + "learning_rate": 1.810811609967844e-05, + "loss": 0.7887, + "step": 4160 + }, + { + "epoch": 1.18, + "learning_rate": 1.8001309663164457e-05, + "loss": 0.7719, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 1.7894641651616838e-05, + "loss": 0.8098, + "step": 4180 + }, + { + "epoch": 1.19, + "learning_rate": 1.7788114174789706e-05, + "loss": 0.7909, + "step": 4190 + }, + { + "epoch": 1.19, + "learning_rate": 1.7681729339657626e-05, + "loss": 0.7791, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 1.7575489250373867e-05, + "loss": 0.7946, + "step": 4210 + }, + { + "epoch": 1.19, + "learning_rate": 1.746939600822883e-05, + "loss": 0.7973, + "step": 4220 + }, + { + "epoch": 1.2, + "learning_rate": 1.7363451711608445e-05, + "loss": 0.7961, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 1.7257658455952747e-05, + "loss": 0.797, + "step": 4240 + }, + { + "epoch": 1.2, + "learning_rate": 1.715201833371432e-05, + "loss": 0.7961, + "step": 4250 + }, + { + "epoch": 1.21, + "learning_rate": 1.7046533434317008e-05, + "loss": 0.7918, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 1.6941205844114522e-05, + "loss": 0.7868, + "step": 4270 + }, + { + "epoch": 1.21, + "learning_rate": 1.683603764634923e-05, + "loss": 0.7843, + "step": 4280 + }, + { + "epoch": 1.21, + "learning_rate": 1.6731030921110903e-05, + "loss": 0.7968, + "step": 4290 + }, + { + "epoch": 1.22, + "learning_rate": 1.6626187745295608e-05, + "loss": 0.7917, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 1.65215101925646e-05, + "loss": 0.7872, + "step": 4310 + }, + { + "epoch": 1.22, + "learning_rate": 1.641700033330336e-05, + "loss": 0.777, + "step": 4320 + }, + { + "epoch": 1.23, + "learning_rate": 1.6312660234580585e-05, + "loss": 0.8049, + "step": 4330 + }, + { + "epoch": 1.23, + "learning_rate": 1.6208491960107324e-05, + "loss": 0.7897, + "step": 4340 + }, + { + "epoch": 1.23, + "learning_rate": 1.6104497570196193e-05, + "loss": 0.792, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 1.600067912172057e-05, + "loss": 0.7866, + "step": 4360 + }, + { + "epoch": 1.24, + "learning_rate": 1.5897038668073965e-05, + "loss": 0.8061, + "step": 4370 + }, + { + "epoch": 1.24, + "learning_rate": 1.5793578259129355e-05, + "loss": 0.777, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 1.5690299941198706e-05, + "loss": 0.7883, + "step": 4390 + }, + { + "epoch": 1.25, + "learning_rate": 1.558720575699242e-05, + "loss": 0.7897, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 1.548429774557901e-05, + "loss": 0.8014, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 1.5381577942344688e-05, + "loss": 0.7882, + "step": 4420 + }, + { + "epoch": 1.25, + "learning_rate": 1.5279048378953222e-05, + "loss": 0.7839, + "step": 4430 + }, + { + "epoch": 1.26, + "learning_rate": 1.517671108330561e-05, + "loss": 0.794, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 1.5074568079500109e-05, + "loss": 0.7739, + "step": 4450 + }, + { + "epoch": 1.26, + "learning_rate": 1.497262138779208e-05, + "loss": 0.7911, + "step": 4460 + }, + { + "epoch": 1.27, + "learning_rate": 1.4870873024554138e-05, + "loss": 0.7907, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 1.4769325002236183e-05, + "loss": 0.803, + "step": 4480 + }, + { + "epoch": 1.27, + "learning_rate": 1.4667979329325651e-05, + "loss": 0.8048, + "step": 4490 + }, + { + "epoch": 1.27, + "learning_rate": 1.4566838010307754e-05, + "loss": 0.7816, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 1.4465903045625878e-05, + "loss": 0.7765, + "step": 4510 + }, + { + "epoch": 1.28, + "learning_rate": 1.4365176431641958e-05, + "loss": 0.7916, + "step": 4520 + }, + { + "epoch": 1.28, + "learning_rate": 1.4264660160597057e-05, + "loss": 0.8015, + "step": 4530 + }, + { + "epoch": 1.29, + "learning_rate": 1.41643562205719e-05, + "loss": 0.7826, + "step": 4540 + }, + { + "epoch": 1.29, + "learning_rate": 1.4064266595447584e-05, + "loss": 0.7834, + "step": 4550 + }, + { + "epoch": 1.29, + "learning_rate": 1.3964393264866368e-05, + "loss": 0.7873, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 1.386473820419244e-05, + "loss": 0.8033, + "step": 4570 + }, + { + "epoch": 1.3, + "learning_rate": 1.376530338447294e-05, + "loss": 0.7973, + "step": 4580 + }, + { + "epoch": 1.3, + "learning_rate": 1.366609077239889e-05, + "loss": 0.7736, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 1.3567102330266369e-05, + "loss": 0.7968, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 1.3468340015937642e-05, + "loss": 0.7773, + "step": 4610 + }, + { + "epoch": 1.31, + "learning_rate": 1.3369805782802467e-05, + "loss": 0.7971, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 1.3271501579739449e-05, + "loss": 0.7808, + "step": 4630 + }, + { + "epoch": 1.31, + "learning_rate": 1.317342935107752e-05, + "loss": 0.7826, + "step": 4640 + }, + { + "epoch": 1.32, + "learning_rate": 1.307559103655743e-05, + "loss": 0.7767, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2977988571293447e-05, + "loss": 0.7962, + "step": 4660 + }, + { + "epoch": 1.32, + "learning_rate": 1.288062388573501e-05, + "loss": 0.7876, + "step": 4670 + }, + { + "epoch": 1.33, + "learning_rate": 1.2783498905628622e-05, + "loss": 0.782, + "step": 4680 + }, + { + "epoch": 1.33, + "learning_rate": 1.2686615551979702e-05, + "loss": 0.7926, + "step": 4690 + }, + { + "epoch": 1.33, + "learning_rate": 1.2589975741014615e-05, + "loss": 0.7939, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 1.2493581384142767e-05, + "loss": 0.7992, + "step": 4710 + }, + { + "epoch": 1.34, + "learning_rate": 1.2397434387918824e-05, + "loss": 0.7766, + "step": 4720 + }, + { + "epoch": 1.34, + "learning_rate": 1.2301536654004948e-05, + "loss": 0.7887, + "step": 4730 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205890079133252e-05, + "loss": 0.7927, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 1.2110496555068218e-05, + "loss": 0.786, + "step": 4750 + }, + { + "epoch": 1.35, + "learning_rate": 1.2015357968569335e-05, + "loss": 0.7821, + "step": 4760 + }, + { + "epoch": 1.35, + "learning_rate": 1.1920476201353763e-05, + "loss": 0.7864, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 1.1825853130059098e-05, + "loss": 0.7888, + "step": 4780 + }, + { + "epoch": 1.36, + "learning_rate": 1.1731490626206263e-05, + "loss": 0.794, + "step": 4790 + }, + { + "epoch": 1.36, + "learning_rate": 1.16373905561625e-05, + "loss": 0.771, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 1.1543554781104477e-05, + "loss": 0.7984, + "step": 4810 + }, + { + "epoch": 1.36, + "learning_rate": 1.1449985156981413e-05, + "loss": 0.7961, + "step": 4820 + }, + { + "epoch": 1.37, + "learning_rate": 1.1356683534478451e-05, + "loss": 0.7824, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 1.1263651758979967e-05, + "loss": 0.7867, + "step": 4840 + }, + { + "epoch": 1.37, + "learning_rate": 1.1170891670533162e-05, + "loss": 0.787, + "step": 4850 + }, + { + "epoch": 1.38, + "learning_rate": 1.107840510381158e-05, + "loss": 0.7789, + "step": 4860 + }, + { + "epoch": 1.38, + "learning_rate": 1.0986193888078882e-05, + "loss": 0.7951, + "step": 4870 + }, + { + "epoch": 1.38, + "learning_rate": 1.0894259847152636e-05, + "loss": 0.8037, + "step": 4880 + }, + { + "epoch": 1.38, + "learning_rate": 1.0802604799368274e-05, + "loss": 0.7901, + "step": 4890 + }, + { + "epoch": 1.39, + "learning_rate": 1.0711230557543078e-05, + "loss": 0.7736, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 1.0620138928940394e-05, + "loss": 0.7743, + "step": 4910 + }, + { + "epoch": 1.39, + "learning_rate": 1.0529331715233795e-05, + "loss": 0.7971, + "step": 4920 + }, + { + "epoch": 1.4, + "learning_rate": 1.0438810712471553e-05, + "loss": 0.7812, + "step": 4930 + }, + { + "epoch": 1.4, + "learning_rate": 1.0348577711041021e-05, + "loss": 0.7788, + "step": 4940 + }, + { + "epoch": 1.4, + "learning_rate": 1.0258634495633277e-05, + "loss": 0.7866, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 1.0168982845207797e-05, + "loss": 0.8023, + "step": 4960 + }, + { + "epoch": 1.41, + "learning_rate": 1.0079624532957316e-05, + "loss": 0.7766, + "step": 4970 + }, + { + "epoch": 1.41, + "learning_rate": 9.99056132627267e-06, + "loss": 0.7831, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 9.901794986707941e-06, + "loss": 0.7927, + "step": 4990 + }, + { + "epoch": 1.42, + "learning_rate": 9.813327269945547e-06, + "loss": 0.7852, + "step": 5000 + }, + { + "epoch": 1.42, + "learning_rate": 9.725159925761532e-06, + "loss": 0.7649, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 9.637294697990961e-06, + "loss": 0.7818, + "step": 5020 + }, + { + "epoch": 1.42, + "learning_rate": 9.549733324493431e-06, + "loss": 0.7789, + "step": 5030 + }, + { + "epoch": 1.43, + "learning_rate": 9.462477537118717e-06, + "loss": 0.7636, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 9.375529061672467e-06, + "loss": 0.7832, + "step": 5050 + }, + { + "epoch": 1.43, + "learning_rate": 9.288889617882136e-06, + "loss": 0.7959, + "step": 5060 + }, + { + "epoch": 1.44, + "learning_rate": 9.202560919362896e-06, + "loss": 0.7896, + "step": 5070 + }, + { + "epoch": 1.44, + "learning_rate": 9.116544673583824e-06, + "loss": 0.781, + "step": 5080 + }, + { + "epoch": 1.44, + "learning_rate": 9.030842581834062e-06, + "loss": 0.7876, + "step": 5090 + }, + { + "epoch": 1.44, + "learning_rate": 8.945456339189198e-06, + "loss": 0.7818, + "step": 5100 + }, + { + "epoch": 1.45, + "learning_rate": 8.860387634477736e-06, + "loss": 0.7851, + "step": 5110 + }, + { + "epoch": 1.45, + "learning_rate": 8.775638150247714e-06, + "loss": 0.7824, + "step": 5120 + }, + { + "epoch": 1.45, + "learning_rate": 8.691209562733371e-06, + "loss": 0.7988, + "step": 5130 + }, + { + "epoch": 1.46, + "learning_rate": 8.607103541822068e-06, + "loss": 0.7771, + "step": 5140 + }, + { + "epoch": 1.46, + "learning_rate": 8.523321751021176e-06, + "loss": 0.7888, + "step": 5150 + }, + { + "epoch": 1.46, + "learning_rate": 8.43986584742526e-06, + "loss": 0.794, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 8.35673748168323e-06, + "loss": 0.7854, + "step": 5170 + }, + { + "epoch": 1.47, + "learning_rate": 8.273938297965736e-06, + "loss": 0.7927, + "step": 5180 + }, + { + "epoch": 1.47, + "learning_rate": 8.191469933932625e-06, + "loss": 0.801, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 8.109334020700591e-06, + "loss": 0.7816, + "step": 5200 + }, + { + "epoch": 1.48, + "learning_rate": 8.027532182810845e-06, + "loss": 0.7912, + "step": 5210 + }, + { + "epoch": 1.48, + "learning_rate": 7.946066038197065e-06, + "loss": 0.7818, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 7.86493719815333e-06, + "loss": 0.7833, + "step": 5230 + }, + { + "epoch": 1.48, + "learning_rate": 7.784147267302274e-06, + "loss": 0.7919, + "step": 5240 + }, + { + "epoch": 1.49, + "learning_rate": 7.70369784356336e-06, + "loss": 0.771, + "step": 5250 + }, + { + "epoch": 1.49, + "learning_rate": 7.62359051812124e-06, + "loss": 0.7887, + "step": 5260 + }, + { + "epoch": 1.49, + "learning_rate": 7.543826875394347e-06, + "loss": 0.7744, + "step": 5270 + }, + { + "epoch": 1.49, + "learning_rate": 7.464408493003483e-06, + "loss": 0.7887, + "step": 5280 + }, + { + "epoch": 1.5, + "learning_rate": 7.385336941740678e-06, + "loss": 0.7638, + "step": 5290 + }, + { + "epoch": 1.5, + "learning_rate": 7.306613785538066e-06, + "loss": 0.7778, + "step": 5300 + }, + { + "epoch": 1.5, + "learning_rate": 7.2282405814370125e-06, + "loss": 0.7769, + "step": 5310 + }, + { + "epoch": 1.51, + "learning_rate": 7.150218879557263e-06, + "loss": 0.7916, + "step": 5320 + }, + { + "epoch": 1.51, + "learning_rate": 7.072550223066321e-06, + "loss": 0.7798, + "step": 5330 + }, + { + "epoch": 1.51, + "learning_rate": 6.9952361481488896e-06, + "loss": 0.7733, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 6.918278183976554e-06, + "loss": 0.7701, + "step": 5350 + }, + { + "epoch": 1.52, + "learning_rate": 6.841677852677447e-06, + "loss": 0.7792, + "step": 5360 + }, + { + "epoch": 1.52, + "learning_rate": 6.765436669306227e-06, + "loss": 0.7863, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 6.689556141814043e-06, + "loss": 0.7821, + "step": 5380 + }, + { + "epoch": 1.53, + "learning_rate": 6.614037771018775e-06, + "loss": 0.7896, + "step": 5390 + }, + { + "epoch": 1.53, + "learning_rate": 6.538883050575284e-06, + "loss": 0.7943, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 6.464093466945919e-06, + "loss": 0.7933, + "step": 5410 + }, + { + "epoch": 1.53, + "learning_rate": 6.389670499371089e-06, + "loss": 0.7773, + "step": 5420 + }, + { + "epoch": 1.54, + "learning_rate": 6.3156156198400315e-06, + "loss": 0.7828, + "step": 5430 + }, + { + "epoch": 1.54, + "learning_rate": 6.241930293061662e-06, + "loss": 0.7769, + "step": 5440 + }, + { + "epoch": 1.54, + "learning_rate": 6.16861597643564e-06, + "loss": 0.7726, + "step": 5450 + }, + { + "epoch": 1.55, + "learning_rate": 6.0956741200235315e-06, + "loss": 0.7956, + "step": 5460 + }, + { + "epoch": 1.55, + "learning_rate": 6.023106166520104e-06, + "loss": 0.7932, + "step": 5470 + }, + { + "epoch": 1.55, + "learning_rate": 5.950913551224838e-06, + "loss": 0.7849, + "step": 5480 + }, + { + "epoch": 1.55, + "learning_rate": 5.879097702013495e-06, + "loss": 0.7968, + "step": 5490 + }, + { + "epoch": 1.56, + "learning_rate": 5.807660039309904e-06, + "loss": 0.7827, + "step": 5500 + }, + { + "epoch": 1.56, + "learning_rate": 5.736601976057848e-06, + "loss": 0.791, + "step": 5510 + }, + { + "epoch": 1.56, + "learning_rate": 5.66592491769315e-06, + "loss": 0.7792, + "step": 5520 + }, + { + "epoch": 1.57, + "learning_rate": 5.595630262115825e-06, + "loss": 0.7808, + "step": 5530 + }, + { + "epoch": 1.57, + "learning_rate": 5.525719399662488e-06, + "loss": 0.7723, + "step": 5540 + }, + { + "epoch": 1.57, + "learning_rate": 5.456193713078797e-06, + "loss": 0.7789, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 5.387054577492165e-06, + "loss": 0.7903, + "step": 5560 + }, + { + "epoch": 1.58, + "learning_rate": 5.318303360384508e-06, + "loss": 0.7801, + "step": 5570 + }, + { + "epoch": 1.58, + "learning_rate": 5.249941421565227e-06, + "loss": 0.7733, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 5.181970113144296e-06, + "loss": 0.7891, + "step": 5590 + }, + { + "epoch": 1.59, + "learning_rate": 5.114390779505557e-06, + "loss": 0.7912, + "step": 5600 + }, + { + "epoch": 1.59, + "learning_rate": 5.047204757280072e-06, + "loss": 0.7917, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 4.980413375319737e-06, + "loss": 0.7922, + "step": 5620 + }, + { + "epoch": 1.59, + "learning_rate": 4.914017954670961e-06, + "loss": 0.79, + "step": 5630 + }, + { + "epoch": 1.6, + "learning_rate": 4.8480198085485765e-06, + "loss": 0.7844, + "step": 5640 + }, + { + "epoch": 1.6, + "learning_rate": 4.782420242309821e-06, + "loss": 0.7855, + "step": 5650 + }, + { + "epoch": 1.6, + "learning_rate": 4.717220553428559e-06, + "loss": 0.779, + "step": 5660 + }, + { + "epoch": 1.61, + "learning_rate": 4.652422031469583e-06, + "loss": 0.7864, + "step": 5670 + }, + { + "epoch": 1.61, + "learning_rate": 4.58802595806315e-06, + "loss": 0.7802, + "step": 5680 + }, + { + "epoch": 1.61, + "learning_rate": 4.524033606879602e-06, + "loss": 0.7776, + "step": 5690 + }, + { + "epoch": 1.61, + "learning_rate": 4.460446243604169e-06, + "loss": 0.778, + "step": 5700 + }, + { + "epoch": 1.62, + "learning_rate": 4.3972651259119706e-06, + "loss": 0.7834, + "step": 5710 + }, + { + "epoch": 1.62, + "learning_rate": 4.3344915034431e-06, + "loss": 0.7875, + "step": 5720 + }, + { + "epoch": 1.62, + "learning_rate": 4.272126617777933e-06, + "loss": 0.787, + "step": 5730 + }, + { + "epoch": 1.63, + "learning_rate": 4.2101717024125576e-06, + "loss": 0.7773, + "step": 5740 + }, + { + "epoch": 1.63, + "learning_rate": 4.148627982734404e-06, + "loss": 0.7853, + "step": 5750 + }, + { + "epoch": 1.63, + "learning_rate": 4.087496675997965e-06, + "loss": 0.7917, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 4.026778991300762e-06, + "loss": 0.7907, + "step": 5770 + }, + { + "epoch": 1.64, + "learning_rate": 3.966476129559391e-06, + "loss": 0.7764, + "step": 5780 + }, + { + "epoch": 1.64, + "learning_rate": 3.90658928348582e-06, + "loss": 0.7718, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.847119637563739e-06, + "loss": 0.791, + "step": 5800 + }, + { + "epoch": 1.64, + "learning_rate": 3.7880683680251855e-06, + "loss": 0.7732, + "step": 5810 + }, + { + "epoch": 1.65, + "learning_rate": 3.7294366428272386e-06, + "loss": 0.7621, + "step": 5820 + }, + { + "epoch": 1.65, + "learning_rate": 3.6712256216289624e-06, + "loss": 0.7619, + "step": 5830 + }, + { + "epoch": 1.65, + "learning_rate": 3.613436455768418e-06, + "loss": 0.782, + "step": 5840 + }, + { + "epoch": 1.66, + "learning_rate": 3.5560702882399406e-06, + "loss": 0.7853, + "step": 5850 + }, + { + "epoch": 1.66, + "learning_rate": 3.499128253671494e-06, + "loss": 0.7896, + "step": 5860 + }, + { + "epoch": 1.66, + "learning_rate": 3.4426114783022546e-06, + "loss": 0.7939, + "step": 5870 + }, + { + "epoch": 1.66, + "learning_rate": 3.3865210799603253e-06, + "loss": 0.7734, + "step": 5880 + }, + { + "epoch": 1.67, + "learning_rate": 3.3308581680406182e-06, + "loss": 0.7951, + "step": 5890 + }, + { + "epoch": 1.67, + "learning_rate": 3.275623843482939e-06, + "loss": 0.7892, + "step": 5900 + }, + { + "epoch": 1.67, + "learning_rate": 3.220819198750172e-06, + "loss": 0.7788, + "step": 5910 + }, + { + "epoch": 1.68, + "learning_rate": 3.166445317806721e-06, + "loss": 0.8137, + "step": 5920 + }, + { + "epoch": 1.68, + "learning_rate": 3.1125032760970203e-06, + "loss": 0.7665, + "step": 5930 + }, + { + "epoch": 1.68, + "learning_rate": 3.0589941405243043e-06, + "loss": 0.7812, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.0059189694294774e-06, + "loss": 0.7824, + "step": 5950 + }, + { + "epoch": 1.69, + "learning_rate": 2.953278812570201e-06, + "loss": 0.7736, + "step": 5960 + }, + { + "epoch": 1.69, + "learning_rate": 2.9010747111001103e-06, + "loss": 0.7759, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 2.849307697548251e-06, + "loss": 0.7946, + "step": 5980 + }, + { + "epoch": 1.7, + "learning_rate": 2.7979787957986225e-06, + "loss": 0.7938, + "step": 5990 + }, + { + "epoch": 1.7, + "learning_rate": 2.7470890210699596e-06, + "loss": 0.7818, + "step": 6000 + }, + { + "epoch": 1.7, + "learning_rate": 2.6966393798956242e-06, + "loss": 0.7773, + "step": 6010 + }, + { + "epoch": 1.7, + "learning_rate": 2.6466308701037253e-06, + "loss": 0.7779, + "step": 6020 + }, + { + "epoch": 1.71, + "learning_rate": 2.597064480797351e-06, + "loss": 0.7981, + "step": 6030 + }, + { + "epoch": 1.71, + "learning_rate": 2.547941192335035e-06, + "loss": 0.7881, + "step": 6040 + }, + { + "epoch": 1.71, + "learning_rate": 2.4992619763113427e-06, + "loss": 0.7772, + "step": 6050 + }, + { + "epoch": 1.72, + "learning_rate": 2.4510277955376885e-06, + "loss": 0.7812, + "step": 6060 + }, + { + "epoch": 1.72, + "learning_rate": 2.403239604023244e-06, + "loss": 0.7753, + "step": 6070 + }, + { + "epoch": 1.72, + "learning_rate": 2.360612333857401e-06, + "loss": 0.7778, + "step": 6080 + }, + { + "epoch": 1.72, + "learning_rate": 2.31367411862298e-06, + "loss": 0.7883, + "step": 6090 + }, + { + "epoch": 1.73, + "learning_rate": 2.2671846093243493e-06, + "loss": 0.7885, + "step": 6100 + }, + { + "epoch": 1.73, + "learning_rate": 2.221144725463359e-06, + "loss": 0.7876, + "step": 6110 + }, + { + "epoch": 1.73, + "learning_rate": 2.1755553776488745e-06, + "loss": 0.8012, + "step": 6120 + }, + { + "epoch": 1.74, + "learning_rate": 2.130417467578724e-06, + "loss": 0.7967, + "step": 6130 + }, + { + "epoch": 1.74, + "learning_rate": 2.0857318880218995e-06, + "loss": 0.7827, + "step": 6140 + }, + { + "epoch": 1.74, + "learning_rate": 2.0414995228008743e-06, + "loss": 0.7657, + "step": 6150 + }, + { + "epoch": 1.74, + "learning_rate": 1.997721246774145e-06, + "loss": 0.7655, + "step": 6160 + }, + { + "epoch": 1.75, + "learning_rate": 1.9543979258189126e-06, + "loss": 0.7713, + "step": 6170 + }, + { + "epoch": 1.75, + "learning_rate": 1.911530416813953e-06, + "loss": 0.7871, + "step": 6180 + }, + { + "epoch": 1.75, + "learning_rate": 1.869119567622679e-06, + "loss": 0.7983, + "step": 6190 + }, + { + "epoch": 1.76, + "learning_rate": 1.8271662170763787e-06, + "loss": 0.8057, + "step": 6200 + }, + { + "epoch": 1.76, + "learning_rate": 1.7856711949575972e-06, + "loss": 0.7798, + "step": 6210 + }, + { + "epoch": 1.76, + "learning_rate": 1.7446353219837592e-06, + "loss": 0.7845, + "step": 6220 + }, + { + "epoch": 1.76, + "learning_rate": 1.704059409790898e-06, + "loss": 0.7907, + "step": 6230 + }, + { + "epoch": 1.77, + "learning_rate": 1.6639442609176409e-06, + "loss": 0.778, + "step": 6240 + }, + { + "epoch": 1.77, + "learning_rate": 1.6242906687893077e-06, + "loss": 0.7924, + "step": 6250 + }, + { + "epoch": 1.77, + "learning_rate": 1.5850994177022265e-06, + "loss": 0.7988, + "step": 6260 + }, + { + "epoch": 1.78, + "learning_rate": 1.546371282808226e-06, + "loss": 0.7741, + "step": 6270 + }, + { + "epoch": 1.78, + "learning_rate": 1.508107030099304e-06, + "loss": 0.7944, + "step": 6280 + }, + { + "epoch": 1.78, + "learning_rate": 1.4703074163924718e-06, + "loss": 0.7845, + "step": 6290 + }, + { + "epoch": 1.78, + "learning_rate": 1.4329731893147792e-06, + "loss": 0.7832, + "step": 6300 + }, + { + "epoch": 1.79, + "learning_rate": 1.396105087288549e-06, + "loss": 0.7933, + "step": 6310 + }, + { + "epoch": 1.79, + "learning_rate": 1.3597038395167516e-06, + "loss": 0.7803, + "step": 6320 + }, + { + "epoch": 1.79, + "learning_rate": 1.3237701659685854e-06, + "loss": 0.7794, + "step": 6330 + }, + { + "epoch": 1.8, + "learning_rate": 1.28830477736524e-06, + "loss": 0.7715, + "step": 6340 + }, + { + "epoch": 1.8, + "learning_rate": 1.253308375165857e-06, + "loss": 0.7918, + "step": 6350 + }, + { + "epoch": 1.8, + "learning_rate": 1.2187816515536105e-06, + "loss": 0.7829, + "step": 6360 + }, + { + "epoch": 1.8, + "learning_rate": 1.184725289422073e-06, + "loss": 0.7932, + "step": 6370 + }, + { + "epoch": 1.81, + "learning_rate": 1.151139962361658e-06, + "loss": 0.7838, + "step": 6380 + }, + { + "epoch": 1.81, + "learning_rate": 1.1180263346463327e-06, + "loss": 0.7767, + "step": 6390 + }, + { + "epoch": 1.81, + "learning_rate": 1.0853850612204646e-06, + "loss": 0.7757, + "step": 6400 + }, + { + "epoch": 1.81, + "learning_rate": 1.053216787685865e-06, + "loss": 0.779, + "step": 6410 + }, + { + "epoch": 1.82, + "learning_rate": 1.0215221502890254e-06, + "loss": 0.7789, + "step": 6420 + }, + { + "epoch": 1.82, + "learning_rate": 9.903017759085365e-07, + "loss": 0.7738, + "step": 6430 + }, + { + "epoch": 1.82, + "learning_rate": 9.595562820426758e-07, + "loss": 0.7873, + "step": 6440 + }, + { + "epoch": 1.83, + "learning_rate": 9.292862767972199e-07, + "loss": 0.7923, + "step": 6450 + }, + { + "epoch": 1.83, + "learning_rate": 8.994923588733856e-07, + "loss": 0.7888, + "step": 6460 + }, + { + "epoch": 1.83, + "learning_rate": 8.701751175560102e-07, + "loss": 0.7749, + "step": 6470 + }, + { + "epoch": 1.83, + "learning_rate": 8.41335132701887e-07, + "loss": 0.7706, + "step": 6480 + }, + { + "epoch": 1.84, + "learning_rate": 8.129729747283016e-07, + "loss": 0.7896, + "step": 6490 + }, + { + "epoch": 1.84, + "learning_rate": 7.85089204601741e-07, + "loss": 0.7918, + "step": 6500 + }, + { + "epoch": 1.84, + "learning_rate": 7.576843738268113e-07, + "loss": 0.7875, + "step": 6510 + }, + { + "epoch": 1.85, + "learning_rate": 7.307590244353263e-07, + "loss": 0.7871, + "step": 6520 + }, + { + "epoch": 1.85, + "learning_rate": 7.043136889755691e-07, + "loss": 0.7734, + "step": 6530 + }, + { + "epoch": 1.85, + "learning_rate": 6.783488905017871e-07, + "loss": 0.7856, + "step": 6540 + }, + { + "epoch": 1.85, + "learning_rate": 6.528651425638272e-07, + "loss": 0.7964, + "step": 6550 + }, + { + "epoch": 1.86, + "learning_rate": 6.278629491969862e-07, + "loss": 0.778, + "step": 6560 + }, + { + "epoch": 1.86, + "learning_rate": 6.033428049120326e-07, + "loss": 0.7914, + "step": 6570 + }, + { + "epoch": 1.86, + "learning_rate": 5.793051946854422e-07, + "loss": 0.7691, + "step": 6580 + }, + { + "epoch": 1.87, + "learning_rate": 5.557505939497915e-07, + "loss": 0.7893, + "step": 6590 + }, + { + "epoch": 1.87, + "learning_rate": 5.326794685843655e-07, + "loss": 0.7833, + "step": 6600 + }, + { + "epoch": 1.87, + "learning_rate": 5.100922749059239e-07, + "loss": 0.7903, + "step": 6610 + }, + { + "epoch": 1.87, + "learning_rate": 4.879894596597018e-07, + "loss": 0.7683, + "step": 6620 + }, + { + "epoch": 1.88, + "learning_rate": 4.663714600105534e-07, + "loss": 0.7717, + "step": 6630 + }, + { + "epoch": 1.88, + "learning_rate": 4.452387035343203e-07, + "loss": 0.7876, + "step": 6640 + }, + { + "epoch": 1.88, + "learning_rate": 4.2459160820935153e-07, + "loss": 0.7888, + "step": 6650 + }, + { + "epoch": 1.89, + "learning_rate": 4.044305824082717e-07, + "loss": 0.7729, + "step": 6660 + }, + { + "epoch": 1.89, + "learning_rate": 3.84756024889868e-07, + "loss": 0.7824, + "step": 6670 + }, + { + "epoch": 1.89, + "learning_rate": 3.6556832479123504e-07, + "loss": 0.7662, + "step": 6680 + }, + { + "epoch": 1.89, + "learning_rate": 3.468678616200427e-07, + "loss": 0.7981, + "step": 6690 + }, + { + "epoch": 1.9, + "learning_rate": 3.2865500524707217e-07, + "loss": 0.7806, + "step": 6700 + }, + { + "epoch": 1.9, + "learning_rate": 3.109301158988609e-07, + "loss": 0.7858, + "step": 6710 + }, + { + "epoch": 1.9, + "learning_rate": 2.936935441506028e-07, + "loss": 0.7827, + "step": 6720 + }, + { + "epoch": 1.91, + "learning_rate": 2.769456309192037e-07, + "loss": 0.7784, + "step": 6730 + }, + { + "epoch": 1.91, + "learning_rate": 2.6068670745654224e-07, + "loss": 0.7761, + "step": 6740 + }, + { + "epoch": 1.91, + "learning_rate": 2.449170953429225e-07, + "loss": 0.7732, + "step": 6750 + }, + { + "epoch": 1.91, + "learning_rate": 2.296371064806957e-07, + "loss": 0.7899, + "step": 6760 + }, + { + "epoch": 1.92, + "learning_rate": 2.1484704308812053e-07, + "loss": 0.7839, + "step": 6770 + }, + { + "epoch": 1.92, + "learning_rate": 2.0054719769335428e-07, + "loss": 0.7831, + "step": 6780 + }, + { + "epoch": 1.92, + "learning_rate": 1.8673785312869063e-07, + "loss": 0.7817, + "step": 6790 + }, + { + "epoch": 1.93, + "learning_rate": 1.7341928252495033e-07, + "loss": 0.792, + "step": 6800 + }, + { + "epoch": 1.93, + "learning_rate": 1.60591749306091e-07, + "loss": 0.7942, + "step": 6810 + }, + { + "epoch": 1.93, + "learning_rate": 1.4825550718398362e-07, + "loss": 0.7607, + "step": 6820 + }, + { + "epoch": 1.93, + "learning_rate": 1.3641080015341369e-07, + "loss": 0.7743, + "step": 6830 + }, + { + "epoch": 1.94, + "learning_rate": 1.2505786248723229e-07, + "loss": 0.763, + "step": 6840 + }, + { + "epoch": 1.94, + "learning_rate": 1.1419691873174043e-07, + "loss": 0.7685, + "step": 6850 + }, + { + "epoch": 1.94, + "learning_rate": 1.038281837022398e-07, + "loss": 0.7773, + "step": 6860 + }, + { + "epoch": 1.95, + "learning_rate": 9.395186247878329e-08, + "loss": 0.7663, + "step": 6870 + }, + { + "epoch": 1.95, + "learning_rate": 8.456815040212562e-08, + "loss": 0.7769, + "step": 6880 + }, + { + "epoch": 1.95, + "learning_rate": 7.567723306984853e-08, + "loss": 0.7921, + "step": 6890 + }, + { + "epoch": 1.95, + "learning_rate": 6.727928633270264e-08, + "loss": 0.7877, + "step": 6900 + }, + { + "epoch": 1.96, + "learning_rate": 5.937447629112414e-08, + "loss": 0.7709, + "step": 6910 + }, + { + "epoch": 1.96, + "learning_rate": 5.196295929193739e-08, + "loss": 0.7921, + "step": 6920 + }, + { + "epoch": 1.96, + "learning_rate": 4.5044881925287994e-08, + "loss": 0.7707, + "step": 6930 + }, + { + "epoch": 1.96, + "learning_rate": 3.862038102172283e-08, + "loss": 0.7752, + "step": 6940 + }, + { + "epoch": 1.97, + "learning_rate": 3.268958364948671e-08, + "loss": 0.7728, + "step": 6950 + }, + { + "epoch": 1.97, + "learning_rate": 2.7252607112018823e-08, + "loss": 0.7651, + "step": 6960 + }, + { + "epoch": 1.97, + "learning_rate": 2.2309558945621257e-08, + "loss": 0.7892, + "step": 6970 + }, + { + "epoch": 1.98, + "learning_rate": 1.7860536917341243e-08, + "loss": 0.7671, + "step": 6980 + }, + { + "epoch": 1.98, + "learning_rate": 1.3905629023031052e-08, + "loss": 0.7767, + "step": 6990 + }, + { + "epoch": 1.98, + "learning_rate": 1.0444913485610498e-08, + "loss": 0.7847, + "step": 7000 + }, + { + "epoch": 1.98, + "learning_rate": 7.478458753518159e-09, + "loss": 0.7814, + "step": 7010 + }, + { + "epoch": 1.99, + "learning_rate": 5.006323499359699e-09, + "loss": 0.7902, + "step": 7020 + }, + { + "epoch": 1.99, + "learning_rate": 3.02855661874768e-09, + "loss": 0.7684, + "step": 7030 + }, + { + "epoch": 1.99, + "learning_rate": 1.5451972293301087e-09, + "loss": 0.7709, + "step": 7040 + }, + { + "epoch": 2.0, + "learning_rate": 5.56274670021617e-10, + "loss": 0.7924, + "step": 7050 + }, + { + "epoch": 2.0, + "learning_rate": 6.180850041781483e-11, + "loss": 0.8148, + "step": 7060 + }, + { + "epoch": 2.0, + "step": 7064, + "total_flos": 1.2677047696255615e+19, + "train_loss": 0.8239178928553991, + "train_runtime": 71865.5404, + "train_samples_per_second": 6.291, + "train_steps_per_second": 0.098 + } + ], + "max_steps": 7064, + "num_train_epochs": 2, + "total_flos": 1.2677047696255615e+19, + "trial_name": null, + "trial_params": null +} diff --git a/sft-qlora/training_args.bin b/sft-qlora/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8bd5ea7554270f553d5441a16ce5f0105c78887 --- /dev/null +++ b/sft-qlora/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cb9a8eab84a15c7b110e05a98a526550eba69b35fa4c758b43a4caafa6db7 +size 3275 diff --git a/sft-qlora/training_loss.png b/sft-qlora/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..b87bb91e400044d36bfded84f92975bd3f482b48 Binary files /dev/null and b/sft-qlora/training_loss.png differ