Update app.py
Browse files
app.py
CHANGED
@@ -135,7 +135,8 @@ model = AutoModelForCausalLM.from_pretrained(
     MODEL_ID,
     device_map="auto",
     low_cpu_mem_usage=True,
-
+    torch_dtype=torch.bfloat16,
+    # quantization_config=quantization_config,
     attn_implementation="flash_attention_2",
 )
 