jwnder committed on
Commit
74ade01
·
verified ·
1 Parent(s): 998a974

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -14
README.md CHANGED
@@ -25,20 +25,8 @@ model_name = "jwnder/core42_jais-13b-chat-bnb-4bit"
25
  import warnings
26
  warnings.filterwarnings('ignore')
27
 
28
- bnb_config = BitsAndBytesConfig(
29
- load_in_4bit=True,
30
- bnb_4bit_quant_type="nf4",
31
- bnb_4bit_compute_dtype=torch.bfloat16,
32
- bnb_4bit_use_double_quant=True,
33
- llm_int8_enable_fp32_cpu_offload=True
34
- )
35
- tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
36
- model = AutoModelForCausalLM.from_pretrained(
37
- model_name,
38
- quantization_config=bnb_config,
39
- device_map="auto",
40
- trust_remote_code=True
41
- )
42
 
43
  inputs = tokenizer("Testing LLM!", return_tensors="pt")
44
  start = datetime.now()
 
25
  import warnings
26
  warnings.filterwarnings('ignore')
27
 
28
+ tokenizer = AutoTokenizer.from_pretrained(model_input_folder, trust_remote_code=True)
29
+ model = AutoModelForCausalLM.from_pretrained(model_input_folder, trust_remote_code=True)
 
 
 
 
 
 
 
 
 
 
 
 
30
 
31
  inputs = tokenizer("Testing LLM!", return_tensors="pt")
32
  start = datetime.now()