aifeifei798 committed on
Commit
20b9178
·
verified ·
1 Parent(s): 035246c

Update bit4-chat.py

Browse files
Files changed (1) hide show
  1. bit4-chat.py +1 -1
bit4-chat.py CHANGED
@@ -10,7 +10,7 @@ quantization_config = BitsAndBytesConfig(
10
  )
11
 
12
  # Define the model name and path for the quantized model
13
- model_name = "nvidia/Llama-3.1-Nemotron-Nano-8B-v1-bnb-4bit"
14
 
15
  # Load the quantized model with the specified configuration
16
  model = AutoModelForCausalLM.from_pretrained(
 
10
  )
11
 
12
  # Define the model name and path for the quantized model
13
+ model_name = "./Llama-3.1-Nemotron-Nano-8B-v1-bnb-4bit"
14
 
15
  # Load the quantized model with the specified configuration
16
  model = AutoModelForCausalLM.from_pretrained(