rphrp1985 committed on
Commit
b91461d
·
verified ·
1 Parent(s): 014e805

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -31,7 +31,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
31
 
32
  # model_id = "mistralai/Mistral-7B-v0.3"
33
 
34
- model_id = "CohereForAI/aya-23-35B"
35
 
36
 
37
  tokenizer = AutoTokenizer.from_pretrained(
@@ -46,9 +46,9 @@ with init_empty_weights():
46
  torch_dtype=torch.float16,
47
  # torch_dtype=torch.fl,
48
  # attn_implementation="flash_attention_2",
49
- # low_cpu_mem_usage=True,
50
  # llm_int8_enable_fp32_cpu_offload=True,
51
- # device_map='cuda',
52
 
53
  )
54
 
 
31
 
32
  # model_id = "mistralai/Mistral-7B-v0.3"
33
 
34
+ model_id = "CohereForAI/aya-23-8B"
35
 
36
 
37
  tokenizer = AutoTokenizer.from_pretrained(
 
46
  torch_dtype=torch.float16,
47
  # torch_dtype=torch.fl,
48
  # attn_implementation="flash_attention_2",
49
+ low_cpu_mem_usage=True,
50
  # llm_int8_enable_fp32_cpu_offload=True,
51
+ device_map='cuda',
52
 
53
  )
54