acezxn committed on
Commit
9571c8f
·
verified ·
1 Parent(s): ae6f891

End of training

Browse files
README.md CHANGED
@@ -35,10 +35,10 @@ This model was trained with SFT.
35
 
36
  ### Framework versions
37
 
38
- - TRL: 0.14.0
39
- - Transformers: 4.48.2
40
  - Pytorch: 2.6.0
41
- - Datasets: 3.2.0
42
  - Tokenizers: 0.21.0
43
 
44
  ## Citations
 
35
 
36
  ### Framework versions
37
 
38
+ - TRL: 0.15.2
39
+ - Transformers: 4.49.0
40
  - Pytorch: 2.6.0
41
+ - Datasets: 3.3.2
42
  - Tokenizers: 0.21.0
43
 
44
  ## Citations
adapter_config.json CHANGED
@@ -23,13 +23,13 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
26
  "v_proj",
 
27
  "down_proj",
28
- "k_proj",
29
  "up_proj",
30
- "gate_proj",
31
- "q_proj",
32
- "o_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "k_proj",
27
  "v_proj",
28
+ "q_proj",
29
  "down_proj",
 
30
  "up_proj",
31
+ "o_proj",
32
+ "gate_proj"
 
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65b5dc25a48f1723ea790f54d5ba3ecbbffdf7273ef9a138abf21de61c9987d7
3
  size 194563400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c1dedb72088a73a439cfe44734f2115f5ab27e2c24ab48682efc1de990d8c59
3
  size 194563400
runs/Feb15_22-30-26_ea6e1e24e8ea/events.out.tfevents.1739658631.ea6e1e24e8ea.190592.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:babeeae9699d20246d3c41fa4f992b1be263d35708176b84f6e96640b966ad01
3
+ size 6520
runs/Feb18_04-06-24_ea6e1e24e8ea/events.out.tfevents.1739851588.ea6e1e24e8ea.682413.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f0ab2be7dea5eec2ebba129cb5c2ae6c65d94b3fb1f3aa9ca7485144c5e1372
3
+ size 4184
runs/Feb18_04-08-29_ea6e1e24e8ea/events.out.tfevents.1739851713.ea6e1e24e8ea.683084.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44a41353e30c2a88e7428d0cac08838d3bc788f57874593588158d4f00876897
3
+ size 4184
runs/Feb18_04-10-40_ea6e1e24e8ea/events.out.tfevents.1739851843.ea6e1e24e8ea.683763.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53c7b4700679a64d678a9748e61d15c7065422b509e7d606d81f30a669e3fedd
3
+ size 74577
runs/Mar13_03-21-28_1c541e6483bb/events.out.tfevents.1741836092.1c541e6483bb.6671.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55c209a95d598c26ebd3f3b35604ebfdad9c68a1b399bd372cc8c690d277d7c9
3
+ size 74609
runs/Mar13_03-44-30_1c541e6483bb/events.out.tfevents.1741837472.1c541e6483bb.11177.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a338969601f123f5e8a33f2d62d1b28078c5ac7b080723c33c74ea1b6e0f6b2
3
+ size 33491
tokenizer_config.json CHANGED
@@ -2061,7 +2061,7 @@
2061
  ],
2062
  "model_max_length": 131072,
2063
  "pad_token": "<|finetune_right_pad_id|>",
2064
- "padding_side": "left",
2065
- "tokenizer_class": "PreTrainedTokenizerFast",
2066
  "unk_token": null
2067
  }
 
2061
  ],
2062
  "model_max_length": 131072,
2063
  "pad_token": "<|finetune_right_pad_id|>",
2064
+ "padding_side": "right",
2065
+ "tokenizer_class": "PreTrainedTokenizer",
2066
  "unk_token": null
2067
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1328e5a15bc595f9802adc522b62ad33513a8ebc15081fd3148d104d1e91bc21
3
- size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb18cffe9997604e0e9fdfdadbf0bc70f88b93ae383f6fba5f372cf14b4f9e48
3
+ size 5688