thangvip committed on
Commit
614a556
·
verified ·
1 Parent(s): 7590dfb

Training in progress, step 399, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b141baf18e509bb39df2d9729eac124c18ec0aa71d5f6467ca60c922f1bc344
3
  size 1342238560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:509eb7625e5d72697ba45e83da0b1443902752698f83af8ab44a82770761b79b
3
  size 1342238560
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b683f572ce53fc051b588f35612307ce9f4b76c303143dc022c654908efa664
3
  size 674092242
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73c2a787bdf4530acd24befc2d71249593128706625caddb933a9e454e4d4dbb
3
  size 674092242
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f52035cf003523191da6704c085aea40d350a3deea0e92e91724980d5259f136
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc6eb7f81374fe232aa541864941cc2fdba3cd1599eb1d67e6d9663327e9b062
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0175165278526774,
5
  "eval_steps": 500,
6
- "global_step": 398,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -2793,6 +2793,13 @@
2793
  "learning_rate": 0.00011260997067448683,
2794
  "loss": 0.6486,
2795
  "step": 398
 
 
 
 
 
 
 
2796
  }
2797
  ],
2798
  "logging_steps": 1,
@@ -2812,7 +2819,7 @@
2812
  "attributes": {}
2813
  }
2814
  },
2815
- "total_flos": 1.2992603159361946e+18,
2816
  "train_batch_size": 2,
2817
  "trial_name": null,
2818
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.020073102043262,
5
  "eval_steps": 500,
6
+ "global_step": 399,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
2793
  "learning_rate": 0.00011260997067448683,
2794
  "loss": 0.6486,
2795
  "step": 398
2796
+ },
2797
+ {
2798
+ "epoch": 1.020073102043262,
2799
+ "grad_norm": 0.1075356975197792,
2800
+ "learning_rate": 0.00011231671554252199,
2801
+ "loss": 0.6775,
2802
+ "step": 399
2803
  }
2804
  ],
2805
  "logging_steps": 1,
 
2819
  "attributes": {}
2820
  }
2821
  },
2822
+ "total_flos": 1.302288297813934e+18,
2823
  "train_batch_size": 2,
2824
  "trial_name": null,
2825
  "trial_params": null