joshswartz committed
Commit 165fa85 · 1 Parent(s): 3e8654a

Upload folder using huggingface_hub

Files changed (3):
  1. README.md +19 -0
  2. adapter_config.json +2 -2
  3. adapter_model.bin +1 -1
README.md CHANGED
@@ -217,4 +217,23 @@ The following `bitsandbytes` quantization config was used during training:
 ### Framework versions
 
 
+- PEFT 0.6.0
+## Training procedure
+
+
+The following `bitsandbytes` quantization config was used during training:
+- quant_method: bitsandbytes
+- load_in_8bit: False
+- load_in_4bit: True
+- llm_int8_threshold: 6.0
+- llm_int8_skip_modules: None
+- llm_int8_enable_fp32_cpu_offload: False
+- llm_int8_has_fp16_weight: False
+- bnb_4bit_quant_type: nf4
+- bnb_4bit_use_double_quant: True
+- bnb_4bit_compute_dtype: float16
+
+### Framework versions
+
+
 - PEFT 0.6.0
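The appended README section records a 4-bit NF4 double-quantization setup. As a minimal sketch (not code from this repo), the listed settings map onto the `transformers` `BitsAndBytesConfig` roughly like this:

```python
# Sketch: the README's quantization config expressed as a BitsAndBytesConfig.
import torch
from transformers import BitsAndBytesConfig

bnb_config = BitsAndBytesConfig(
    load_in_4bit=True,                     # load_in_4bit: True
    bnb_4bit_quant_type="nf4",             # bnb_4bit_quant_type: nf4
    bnb_4bit_use_double_quant=True,        # bnb_4bit_use_double_quant: True
    bnb_4bit_compute_dtype=torch.float16,  # bnb_4bit_compute_dtype: float16
    llm_int8_threshold=6.0,                # int8 fields match the card's
    llm_int8_has_fp16_weight=False,        # (default) values; they are
    llm_int8_enable_fp32_cpu_offload=False,  # unused in 4-bit mode
)
```

Passing this object as `quantization_config=bnb_config` to `AutoModelForCausalLM.from_pretrained(...)` reproduces the quantization setup the card describes.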
adapter_config.json CHANGED
@@ -16,11 +16,11 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "dense_4h_to_h",
     "dense_h_to_4h",
     "lm_head",
-    "dense",
     "query_key_value",
-    "dense_4h_to_h"
+    "dense"
   ],
   "task_type": "CAUSAL_LM"
 }
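This change only reorders `target_modules` (moving `dense_4h_to_h` to the front and `dense` to the end); the set of adapted layers is unchanged. As a sketch, a `peft` `LoraConfig` producing the updated list might look like the following; `r` and `lora_alpha` are hypothetical, since the diff does not show them:

```python
# Sketch only: a LoraConfig with the same target_modules as the updated
# adapter_config.json. r and lora_alpha are hypothetical placeholder values.
from peft import LoraConfig

lora_config = LoraConfig(
    r=16,           # hypothetical rank
    lora_alpha=32,  # hypothetical scaling factor
    target_modules=[
        "dense_4h_to_h",
        "dense_h_to_4h",
        "lm_head",
        "query_key_value",
        "dense",
    ],
    task_type="CAUSAL_LM",
)
```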
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fe41197f64abcb667a3dc1505d4915f990797d7eb427211513fbf933a27ceb94
+oid sha256:9c700e1c9d62ce24314480f194c736371156f6900c09cb6c5a09d2c3b8c26146
 size 214800210
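Only the git-lfs pointer changed here: the sha256 oid records new adapter weights, while the size stays 214800210 bytes. A minimal sketch for checking a downloaded `adapter_model.bin` against the pointer's oid (the local path is an assumption):

```python
# Sketch: verify a downloaded adapter_model.bin against the LFS pointer's oid.
import hashlib

EXPECTED = "9c700e1c9d62ce24314480f194c736371156f6900c09cb6c5a09d2c3b8c26146"

h = hashlib.sha256()
with open("adapter_model.bin", "rb") as f:  # path is an assumption
    for chunk in iter(lambda: f.read(1 << 20), b""):  # hash in 1 MiB chunks
        h.update(chunk)

assert h.hexdigest() == EXPECTED, f"hash mismatch: {h.hexdigest()}"
```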