Alphatao committed on
Commit
dbce512
·
verified ·
1 Parent(s): b665d92

Training in progress, step 2, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,12 +20,12 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "gate_proj",
24
- "k_proj",
25
  "q_proj",
26
- "up_proj",
27
- "down_proj",
28
  "v_proj",
 
 
29
  "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "down_proj",
24
  "gate_proj",
 
25
  "q_proj",
 
 
26
  "v_proj",
27
+ "up_proj",
28
+ "k_proj",
29
  "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6015c8163f1df8e22c794a249e6c00712349603742ea89cab4bca412edf7f67
3
  size 671149168
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd3281f036d04d9f5f470e3ae181a36a2a8d62bd14263758ff7b2f7275a8fefd
3
  size 671149168
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b434b9fffdf083fb79bb4c69340230d1cc690041651fbf48e304454dee1ec24
3
  size 341314196
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb2aefcd8a898c389afd5016fecc88116ad90317cf7b34a872246179f50b5304
3
  size 341314196
last-checkpoint/trainer_state.json CHANGED
@@ -10,7 +10,7 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0002717883674578728,
13
- "grad_norm": 4.489199161529541,
14
  "learning_rate": 2e-05,
15
  "loss": 5.3201,
16
  "step": 1
@@ -18,14 +18,14 @@
18
  {
19
  "epoch": 0.0002717883674578728,
20
  "eval_loss": 5.817660331726074,
21
- "eval_runtime": 742.2088,
22
- "eval_samples_per_second": 6.262,
23
- "eval_steps_per_second": 1.566,
24
  "step": 1
25
  },
26
  {
27
  "epoch": 0.0005435767349157456,
28
- "grad_norm": 7.107272624969482,
29
  "learning_rate": 4e-05,
30
  "loss": 5.8911,
31
  "step": 2
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0002717883674578728,
13
+ "grad_norm": 4.251254558563232,
14
  "learning_rate": 2e-05,
15
  "loss": 5.3201,
16
  "step": 1
 
18
  {
19
  "epoch": 0.0002717883674578728,
20
  "eval_loss": 5.817660331726074,
21
+ "eval_runtime": 740.7465,
22
+ "eval_samples_per_second": 6.275,
23
+ "eval_steps_per_second": 1.569,
24
  "step": 1
25
  },
26
  {
27
  "epoch": 0.0005435767349157456,
28
+ "grad_norm": 6.6031174659729,
29
  "learning_rate": 4e-05,
30
  "loss": 5.8911,
31
  "step": 2
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:248ce35ff18e493983381177f2ebda25f083ce99a178fa16cbf1b7fc2bec948d
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:749d32b49d3872f7f415b6b04cd14255dda2b9c5197a883623274fec8966023e
3
  size 6776