Safetensors
qwen3
ehartford committed on
Commit
d191028
·
verified ·
1 Parent(s): beb3696

Update stage1_v2.py

Browse files
Files changed (1) hide show
  1. stage1_v2.py +1 -1
stage1_v2.py CHANGED
@@ -46,7 +46,7 @@ HEAD_DIM = 128
46
  DELTA_HIDDEN = TGT_HIDDEN_SIZE - SRC_HIDDEN_SIZE
47
  DELTA_INTERMEDIATE = TGT_INTERMEDIATE_SIZE - SRC_INTERMEDIATE_SIZE
48
 
49
- OUTPUT_DIR = "./Qwen3-32B-to-72B-Stage1-v2-sharted"
50
 
51
  # GPU configuration
52
  NUM_GPUS = 8
 
46
  DELTA_HIDDEN = TGT_HIDDEN_SIZE - SRC_HIDDEN_SIZE
47
  DELTA_INTERMEDIATE = TGT_INTERMEDIATE_SIZE - SRC_INTERMEDIATE_SIZE
48
 
49
+ OUTPUT_DIR = "./Qwen3-58B-Embiggened"
50
 
51
  # GPU configuration
52
  NUM_GPUS = 8