rphrp1985 committed on
Commit
add0b80
·
verified ·
1 Parent(s): 6d1ecc6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -127,7 +127,7 @@ CONTEXT_LENGTH = 16000
127
 
128
  device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
129
  quantization_config = BitsAndBytesConfig(
130
- load_in_8bit=True,
131
  bnb_4bit_compute_dtype=torch.bfloat16
132
  )
133
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
 
127
 
128
  device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
129
  quantization_config = BitsAndBytesConfig(
130
+ load_in_4bit=True,
131
  bnb_4bit_compute_dtype=torch.bfloat16
132
  )
133
  tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)