rphrp1985 committed on
Commit
1b0ef2e
·
verified ·
1 Parent(s): 08206a7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -135,7 +135,8 @@ model = AutoModelForCausalLM.from_pretrained(
135
  MODEL_ID,
136
  device_map="auto",
137
  low_cpu_mem_usage=True,
138
- quantization_config=quantization_config,
 
139
  attn_implementation="flash_attention_2",
140
  )
141
 
 
135
  MODEL_ID,
136
  device_map="auto",
137
  low_cpu_mem_usage=True,
138
+ torch_dtype=torch.bfloat16,
139
+ # quantization_config=quantization_config,
140
  attn_implementation="flash_attention_2",
141
  )
142