SreyanG-NVIDIA committed on
Commit
e110d57
·
verified ·
1 Parent(s): 253048f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -2
app.py CHANGED
@@ -14,11 +14,19 @@ MODEL_BASE_THINK = os.path.join(MODEL_BASE_SINGLE, 'stage35')
14
 
15
  # model_single = llava.load(MODEL_BASE_SINGLE, model_base=None, devices=[0])
16
  model_single = llava.load(MODEL_BASE_SINGLE, model_base=None)
17
- model_single = model_single.to("cuda")
18
- model_single_copy = copy.deepcopy(model_single)
19
 
20
  generation_config_single = model_single.default_generation_config
21
 
 
 
 
 
 
 
 
 
22
  model_think = PeftModel.from_pretrained(
23
  model_single,
24
  MODEL_BASE_THINK,
 
14
 
15
  # model_single = llava.load(MODEL_BASE_SINGLE, model_base=None, devices=[0])
16
  model_single = llava.load(MODEL_BASE_SINGLE, model_base=None)
17
+ model_single = model_single.to("cuda")
18
+ model_single_copy = copy.deepcopy(model_single) # keep a copy of the original model for non-thinking mode
19
 
20
  generation_config_single = model_single.default_generation_config
21
 
22
+ non_lora_trainables = torch.load(
23
+ os.path.join(MODEL_BASE_THINK, "non_lora_trainables.bin"),
24
+ map_location="cpu",
25
+ )
26
+ non_lora_trainables = {
27
+ (k[6:] if k.startswith("model.") else k): v for k, v in non_lora_trainables.items()
28
+ }
29
+ model.load_state_dict(non_lora_trainables, strict=False)
30
  model_think = PeftModel.from_pretrained(
31
  model_single,
32
  MODEL_BASE_THINK,