Update app.py
Browse files
app.py
CHANGED
@@ -127,7 +127,7 @@ CONTEXT_LENGTH = 16000
|
|
127 |
|
128 |
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
|
129 |
quantization_config = BitsAndBytesConfig(
|
130 |
-
|
131 |
bnb_4bit_compute_dtype=torch.bfloat16
|
132 |
)
|
133 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
|
|
127 |
|
128 |
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
|
129 |
quantization_config = BitsAndBytesConfig(
|
130 |
+
load_in_4bit=True,
|
131 |
bnb_4bit_compute_dtype=torch.bfloat16
|
132 |
)
|
133 |
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|